Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
godotengine
GitHub Repository: godotengine/godot
Path: blob/master/modules/raycast/raycast_occlusion_cull.cpp
10277 views
1
/**************************************************************************/
2
/* raycast_occlusion_cull.cpp */
3
/**************************************************************************/
4
/* This file is part of: */
5
/* GODOT ENGINE */
6
/* https://godotengine.org */
7
/**************************************************************************/
8
/* Copyright (c) 2014-present Godot Engine contributors (see AUTHORS.md). */
9
/* Copyright (c) 2007-2014 Juan Linietsky, Ariel Manzur. */
10
/* */
11
/* Permission is hereby granted, free of charge, to any person obtaining */
12
/* a copy of this software and associated documentation files (the */
13
/* "Software"), to deal in the Software without restriction, including */
14
/* without limitation the rights to use, copy, modify, merge, publish, */
15
/* distribute, sublicense, and/or sell copies of the Software, and to */
16
/* permit persons to whom the Software is furnished to do so, subject to */
17
/* the following conditions: */
18
/* */
19
/* The above copyright notice and this permission notice shall be */
20
/* included in all copies or substantial portions of the Software. */
21
/* */
22
/* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, */
23
/* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF */
24
/* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. */
25
/* IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY */
26
/* CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, */
27
/* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE */
28
/* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. */
29
/**************************************************************************/
30
31
#include "raycast_occlusion_cull.h"
32
33
#include "core/config/project_settings.h"
34
#include "core/object/worker_thread_pool.h"
35
#include "core/templates/local_vector.h"
36
37
#ifdef __SSE2__
38
#include <pmmintrin.h>
39
#endif
40
41
RaycastOcclusionCull *RaycastOcclusionCull::raycast_singleton = nullptr;
42
43
void RaycastOcclusionCull::RaycastHZBuffer::clear() {
44
HZBuffer::clear();
45
46
if (camera_rays_unaligned_buffer) {
47
memfree(camera_rays_unaligned_buffer);
48
camera_rays_unaligned_buffer = nullptr;
49
camera_rays = nullptr;
50
}
51
camera_ray_masks.clear();
52
camera_rays_tile_count = 0;
53
tile_grid_size = Size2i();
54
}
55
56
void RaycastOcclusionCull::RaycastHZBuffer::resize(const Size2i &p_size) {
57
if (p_size == Size2i()) {
58
clear();
59
return;
60
}
61
62
if (!sizes.is_empty() && p_size == sizes[0]) {
63
return; // Size didn't change
64
}
65
66
HZBuffer::resize(p_size);
67
68
tile_grid_size = Size2i(Math::ceil(p_size.x / (float)TILE_SIZE), Math::ceil(p_size.y / (float)TILE_SIZE));
69
camera_rays_tile_count = tile_grid_size.x * tile_grid_size.y;
70
71
if (camera_rays_unaligned_buffer) {
72
memfree(camera_rays_unaligned_buffer);
73
}
74
75
const int alignment = 64; // Embree requires ray packets to be 64-aligned
76
camera_rays_unaligned_buffer = (uint8_t *)memalloc(camera_rays_tile_count * sizeof(CameraRayTile) + alignment);
77
camera_rays = (CameraRayTile *)(camera_rays_unaligned_buffer + alignment - (((uint64_t)camera_rays_unaligned_buffer) % alignment));
78
79
camera_ray_masks.resize(camera_rays_tile_count * TILE_RAYS);
80
memset(camera_ray_masks.ptr(), ~0, camera_rays_tile_count * TILE_RAYS * sizeof(uint32_t));
81
}
82
83
void RaycastOcclusionCull::RaycastHZBuffer::update_camera_rays(const Transform3D &p_cam_transform, const Vector3 &p_near_bottom_left, const Vector2 &p_near_extents, real_t p_z_far, bool p_cam_orthogonal) {
84
CameraRayThreadData td;
85
td.thread_count = WorkerThreadPool::get_singleton()->get_thread_count();
86
87
td.z_near = -p_near_bottom_left.z;
88
td.z_far = p_z_far * 1.05f;
89
td.camera_pos = p_cam_transform.origin;
90
td.camera_dir = -p_cam_transform.basis.get_column(2);
91
td.camera_orthogonal = p_cam_orthogonal;
92
93
// Calculate the world coordinates of the viewport.
94
td.pixel_corner = p_cam_transform.xform(p_near_bottom_left);
95
Vector3 top_corner_world = p_cam_transform.xform(p_near_bottom_left + Vector3(0, p_near_extents.y, 0));
96
Vector3 right_corner_world = p_cam_transform.xform(p_near_bottom_left + Vector3(p_near_extents.x, 0, 0));
97
98
td.pixel_u_interp = right_corner_world - td.pixel_corner;
99
td.pixel_v_interp = top_corner_world - td.pixel_corner;
100
101
debug_tex_range = td.z_far;
102
103
WorkerThreadPool::GroupID group_task = WorkerThreadPool::get_singleton()->add_template_group_task(this, &RaycastHZBuffer::_camera_rays_threaded, &td, td.thread_count, -1, true, SNAME("RaycastOcclusionCullUpdateCamera"));
104
WorkerThreadPool::get_singleton()->wait_for_group_task_completion(group_task);
105
}
106
107
void RaycastOcclusionCull::RaycastHZBuffer::_camera_rays_threaded(uint32_t p_thread, const CameraRayThreadData *p_data) {
108
uint32_t total_tiles = camera_rays_tile_count;
109
uint32_t total_threads = p_data->thread_count;
110
uint32_t from = p_thread * total_tiles / total_threads;
111
uint32_t to = (p_thread + 1 == total_threads) ? total_tiles : ((p_thread + 1) * total_tiles / total_threads);
112
_generate_camera_rays(p_data, from, to);
113
}
114
115
void RaycastOcclusionCull::RaycastHZBuffer::_generate_camera_rays(const CameraRayThreadData *p_data, int p_from, int p_to) {
116
const Size2i &buffer_size = sizes[0];
117
118
for (int i = p_from; i < p_to; i++) {
119
CameraRayTile &tile = camera_rays[i];
120
int tile_x = (i % tile_grid_size.x) * TILE_SIZE;
121
int tile_y = (i / tile_grid_size.x) * TILE_SIZE;
122
123
for (int j = 0; j < TILE_RAYS; j++) {
124
int x = tile_x + j % TILE_SIZE;
125
int y = tile_y + j / TILE_SIZE;
126
127
float u = (float(x) + 0.5f) / buffer_size.x;
128
float v = (float(y) + 0.5f) / buffer_size.y;
129
Vector3 pixel_pos = p_data->pixel_corner + u * p_data->pixel_u_interp + v * p_data->pixel_v_interp;
130
131
tile.ray.tnear[j] = p_data->z_near;
132
133
Vector3 dir;
134
if (p_data->camera_orthogonal) {
135
dir = p_data->camera_dir;
136
tile.ray.org_x[j] = pixel_pos.x - dir.x * p_data->z_near;
137
tile.ray.org_y[j] = pixel_pos.y - dir.y * p_data->z_near;
138
tile.ray.org_z[j] = pixel_pos.z - dir.z * p_data->z_near;
139
} else {
140
dir = (pixel_pos - p_data->camera_pos).normalized();
141
tile.ray.org_x[j] = p_data->camera_pos.x;
142
tile.ray.org_y[j] = p_data->camera_pos.y;
143
tile.ray.org_z[j] = p_data->camera_pos.z;
144
tile.ray.tnear[j] /= dir.dot(p_data->camera_dir);
145
}
146
147
tile.ray.dir_x[j] = dir.x;
148
tile.ray.dir_y[j] = dir.y;
149
tile.ray.dir_z[j] = dir.z;
150
151
tile.ray.tfar[j] = p_data->z_far;
152
tile.ray.time[j] = 0.0f;
153
154
tile.ray.flags[j] = 0;
155
tile.ray.mask[j] = ~0U;
156
tile.hit.geomID[j] = RTC_INVALID_GEOMETRY_ID;
157
}
158
}
159
}
160
161
void RaycastOcclusionCull::RaycastHZBuffer::sort_rays(const Vector3 &p_camera_dir, bool p_orthogonal) {
162
ERR_FAIL_COND(is_empty());
163
164
Size2i buffer_size = sizes[0];
165
for (int i = 0; i < tile_grid_size.y; i++) {
166
for (int j = 0; j < tile_grid_size.x; j++) {
167
for (int tile_i = 0; tile_i < TILE_SIZE; tile_i++) {
168
for (int tile_j = 0; tile_j < TILE_SIZE; tile_j++) {
169
int x = j * TILE_SIZE + tile_j;
170
int y = i * TILE_SIZE + tile_i;
171
if (x >= buffer_size.x || y >= buffer_size.y) {
172
continue;
173
}
174
int k = tile_i * TILE_SIZE + tile_j;
175
int tile_index = i * tile_grid_size.x + j;
176
177
mips[0][y * buffer_size.x + x] = camera_rays[tile_index].ray.tfar[k];
178
}
179
}
180
}
181
}
182
}
183
184
RaycastOcclusionCull::RaycastHZBuffer::~RaycastHZBuffer() {
185
if (camera_rays_unaligned_buffer) {
186
memfree(camera_rays_unaligned_buffer);
187
}
188
}
189
190
////////////////////////////////////////////////////////
191
192
bool RaycastOcclusionCull::is_occluder(RID p_rid) {
193
return occluder_owner.owns(p_rid);
194
}
195
196
RID RaycastOcclusionCull::occluder_allocate() {
197
return occluder_owner.allocate_rid();
198
}
199
200
void RaycastOcclusionCull::occluder_initialize(RID p_occluder) {
201
Occluder *occluder = memnew(Occluder);
202
occluder_owner.initialize_rid(p_occluder, occluder);
203
}
204
205
void RaycastOcclusionCull::occluder_set_mesh(RID p_occluder, const PackedVector3Array &p_vertices, const PackedInt32Array &p_indices) {
206
Occluder *occluder = occluder_owner.get_or_null(p_occluder);
207
ERR_FAIL_NULL(occluder);
208
209
occluder->vertices = p_vertices;
210
occluder->indices = p_indices;
211
212
for (const InstanceID &E : occluder->users) {
213
RID scenario_rid = E.scenario;
214
RID instance_rid = E.instance;
215
ERR_CONTINUE(!scenarios.has(scenario_rid));
216
Scenario &scenario = scenarios[scenario_rid];
217
ERR_CONTINUE(!scenario.instances.has(instance_rid));
218
219
if (!scenario.dirty_instances.has(instance_rid)) {
220
scenario.dirty_instances.insert(instance_rid);
221
scenario.dirty_instances_array.push_back(instance_rid);
222
}
223
}
224
}
225
226
void RaycastOcclusionCull::free_occluder(RID p_occluder) {
227
Occluder *occluder = occluder_owner.get_or_null(p_occluder);
228
ERR_FAIL_NULL(occluder);
229
memdelete(occluder);
230
occluder_owner.free(p_occluder);
231
}
232
233
////////////////////////////////////////////////////////
234
235
void RaycastOcclusionCull::add_scenario(RID p_scenario) {
236
ERR_FAIL_COND(scenarios.has(p_scenario));
237
scenarios[p_scenario] = Scenario();
238
}
239
240
void RaycastOcclusionCull::remove_scenario(RID p_scenario) {
241
Scenario *scenario = scenarios.getptr(p_scenario);
242
ERR_FAIL_NULL(scenario);
243
scenario->free();
244
scenarios.erase(p_scenario);
245
}
246
247
void RaycastOcclusionCull::scenario_set_instance(RID p_scenario, RID p_instance, RID p_occluder, const Transform3D &p_xform, bool p_enabled) {
248
ERR_FAIL_COND(!scenarios.has(p_scenario));
249
Scenario &scenario = scenarios[p_scenario];
250
251
if (!scenario.instances.has(p_instance)) {
252
scenario.instances[p_instance] = OccluderInstance();
253
}
254
255
OccluderInstance &instance = scenario.instances[p_instance];
256
257
bool changed = false;
258
259
if (instance.removed) {
260
instance.removed = false;
261
scenario.removed_instances.erase(p_instance);
262
changed = true; // It was removed and re-added, we might have missed some changes
263
}
264
265
if (instance.occluder != p_occluder) {
266
Occluder *old_occluder = occluder_owner.get_or_null(instance.occluder);
267
if (old_occluder) {
268
old_occluder->users.erase(InstanceID(p_scenario, p_instance));
269
}
270
271
instance.occluder = p_occluder;
272
273
if (p_occluder.is_valid()) {
274
Occluder *occluder = occluder_owner.get_or_null(p_occluder);
275
ERR_FAIL_NULL(occluder);
276
occluder->users.insert(InstanceID(p_scenario, p_instance));
277
}
278
changed = true;
279
}
280
281
if (instance.xform != p_xform) {
282
scenario.instances[p_instance].xform = p_xform;
283
changed = true;
284
}
285
286
if (instance.enabled != p_enabled) {
287
instance.enabled = p_enabled;
288
scenario.dirty = true; // The scenario needs a scene re-build, but the instance doesn't need update
289
}
290
291
if (changed && !scenario.dirty_instances.has(p_instance)) {
292
scenario.dirty_instances.insert(p_instance);
293
scenario.dirty_instances_array.push_back(p_instance);
294
scenario.dirty = true;
295
}
296
}
297
298
void RaycastOcclusionCull::scenario_remove_instance(RID p_scenario, RID p_instance) {
299
ERR_FAIL_COND(!scenarios.has(p_scenario));
300
Scenario &scenario = scenarios[p_scenario];
301
302
if (scenario.instances.has(p_instance)) {
303
OccluderInstance &instance = scenario.instances[p_instance];
304
305
if (!instance.removed) {
306
Occluder *occluder = occluder_owner.get_or_null(instance.occluder);
307
if (occluder) {
308
occluder->users.erase(InstanceID(p_scenario, p_instance));
309
}
310
311
scenario.removed_instances.push_back(p_instance);
312
instance.removed = true;
313
}
314
}
315
}
316
317
void RaycastOcclusionCull::Scenario::_update_dirty_instance_thread(int p_idx, RID *p_instances) {
318
_update_dirty_instance(p_idx, p_instances);
319
}
320
321
void RaycastOcclusionCull::Scenario::_update_dirty_instance(int p_idx, RID *p_instances) {
322
OccluderInstance *occ_inst = instances.getptr(p_instances[p_idx]);
323
324
if (!occ_inst) {
325
return;
326
}
327
328
Occluder *occ = raycast_singleton->occluder_owner.get_or_null(occ_inst->occluder);
329
330
if (!occ) {
331
return;
332
}
333
334
int vertices_size = occ->vertices.size();
335
336
// Embree requires the last element to be readable by a 16-byte SSE load instruction, so we add padding to be safe.
337
occ_inst->xformed_vertices.resize(3 * vertices_size + 3);
338
339
const Vector3 *read_ptr = occ->vertices.ptr();
340
float *write_ptr = occ_inst->xformed_vertices.ptr();
341
342
if (vertices_size > 1024) {
343
TransformThreadData td;
344
td.xform = occ_inst->xform;
345
td.read = read_ptr;
346
td.write = write_ptr;
347
td.vertex_count = vertices_size;
348
td.thread_count = WorkerThreadPool::get_singleton()->get_thread_count();
349
WorkerThreadPool::GroupID group_task = WorkerThreadPool::get_singleton()->add_template_group_task(this, &Scenario::_transform_vertices_thread, &td, td.thread_count, -1, true, SNAME("RaycastOcclusionCull"));
350
WorkerThreadPool::get_singleton()->wait_for_group_task_completion(group_task);
351
352
} else {
353
_transform_vertices_range(read_ptr, write_ptr, occ_inst->xform, 0, vertices_size);
354
}
355
356
occ_inst->indices.resize(occ->indices.size());
357
memcpy(occ_inst->indices.ptr(), occ->indices.ptr(), occ->indices.size() * sizeof(int32_t));
358
}
359
360
void RaycastOcclusionCull::Scenario::_transform_vertices_thread(uint32_t p_thread, TransformThreadData *p_data) {
361
uint32_t vertex_total = p_data->vertex_count;
362
uint32_t total_threads = p_data->thread_count;
363
uint32_t from = p_thread * vertex_total / total_threads;
364
uint32_t to = (p_thread + 1 == total_threads) ? vertex_total : ((p_thread + 1) * vertex_total / total_threads);
365
_transform_vertices_range(p_data->read, p_data->write, p_data->xform, from, to);
366
}
367
368
void RaycastOcclusionCull::Scenario::_transform_vertices_range(const Vector3 *p_read, float *p_write, const Transform3D &p_xform, int p_from, int p_to) {
369
float *floats_w = p_write + 3 * p_from;
370
for (int i = p_from; i < p_to; i++) {
371
const Vector3 p = p_xform.xform(p_read[i]);
372
floats_w[0] = p.x;
373
floats_w[1] = p.y;
374
floats_w[2] = p.z;
375
floats_w += 3;
376
}
377
}
378
379
void RaycastOcclusionCull::Scenario::free() {
380
if (commit_thread) {
381
if (commit_thread->is_started()) {
382
commit_thread->wait_to_finish();
383
}
384
memdelete(commit_thread);
385
commit_thread = nullptr;
386
}
387
388
for (int i = 0; i < 2; i++) {
389
if (ebr_scene[i]) {
390
rtcReleaseScene(ebr_scene[i]);
391
ebr_scene[i] = nullptr;
392
}
393
}
394
}
395
396
void RaycastOcclusionCull::Scenario::_commit_scene(void *p_ud) {
397
Scenario *scenario = (Scenario *)p_ud;
398
int commit_idx = 1 - (scenario->current_scene_idx);
399
rtcCommitScene(scenario->ebr_scene[commit_idx]);
400
scenario->commit_done = true;
401
}
402
403
void RaycastOcclusionCull::Scenario::update() {
404
ERR_FAIL_NULL(singleton);
405
406
if (commit_thread == nullptr) {
407
commit_thread = memnew(Thread);
408
}
409
410
if (commit_thread->is_started()) {
411
if (commit_done) {
412
commit_thread->wait_to_finish();
413
current_scene_idx = 1 - current_scene_idx;
414
} else {
415
return;
416
}
417
}
418
419
if (!dirty && removed_instances.is_empty() && dirty_instances_array.is_empty()) {
420
return;
421
}
422
423
for (const RID &scenario : removed_instances) {
424
instances.erase(scenario);
425
}
426
427
if (dirty_instances_array.size() / WorkerThreadPool::get_singleton()->get_thread_count() > 128) {
428
// Lots of instances, use per-instance threading
429
WorkerThreadPool::GroupID group_task = WorkerThreadPool::get_singleton()->add_template_group_task(this, &Scenario::_update_dirty_instance_thread, dirty_instances_array.ptr(), dirty_instances_array.size(), -1, true, SNAME("RaycastOcclusionCullUpdate"));
430
WorkerThreadPool::get_singleton()->wait_for_group_task_completion(group_task);
431
432
} else {
433
// Few instances, use threading on the vertex transforms
434
for (unsigned int i = 0; i < dirty_instances_array.size(); i++) {
435
_update_dirty_instance(i, dirty_instances_array.ptr());
436
}
437
}
438
439
dirty_instances.clear();
440
dirty_instances_array.clear();
441
removed_instances.clear();
442
443
if (raycast_singleton->ebr_device == nullptr) {
444
raycast_singleton->_init_embree();
445
}
446
447
int next_scene_idx = 1 - current_scene_idx;
448
RTCScene &next_scene = ebr_scene[next_scene_idx];
449
450
if (next_scene) {
451
rtcReleaseScene(next_scene);
452
}
453
454
next_scene = rtcNewScene(raycast_singleton->ebr_device);
455
rtcSetSceneBuildQuality(next_scene, RTCBuildQuality(raycast_singleton->build_quality));
456
457
for (const KeyValue<RID, OccluderInstance> &E : instances) {
458
const OccluderInstance *occ_inst = &E.value;
459
const Occluder *occ = raycast_singleton->occluder_owner.get_or_null(occ_inst->occluder);
460
461
if (!occ || !occ_inst->enabled) {
462
continue;
463
}
464
465
RTCGeometry geom = rtcNewGeometry(raycast_singleton->ebr_device, RTC_GEOMETRY_TYPE_TRIANGLE);
466
rtcSetSharedGeometryBuffer(geom, RTC_BUFFER_TYPE_VERTEX, 0, RTC_FORMAT_FLOAT3, occ_inst->xformed_vertices.ptr(), 0, sizeof(float) * 3, occ_inst->xformed_vertices.size() / 3);
467
rtcSetSharedGeometryBuffer(geom, RTC_BUFFER_TYPE_INDEX, 0, RTC_FORMAT_UINT3, occ_inst->indices.ptr(), 0, sizeof(uint32_t) * 3, occ_inst->indices.size() / 3);
468
rtcCommitGeometry(geom);
469
rtcAttachGeometry(next_scene, geom);
470
rtcReleaseGeometry(geom);
471
}
472
473
dirty = false;
474
commit_done = false;
475
commit_thread->start(&Scenario::_commit_scene, this);
476
}
477
478
void RaycastOcclusionCull::Scenario::_raycast(uint32_t p_idx, const RaycastThreadData *p_raycast_data) const {
479
RTCRayQueryContext context;
480
rtcInitRayQueryContext(&context);
481
RTCIntersectArguments args;
482
rtcInitIntersectArguments(&args);
483
args.flags = RTC_RAY_QUERY_FLAG_COHERENT;
484
args.context = &context;
485
rtcIntersect16((const int *)&p_raycast_data->masks[p_idx * TILE_RAYS], ebr_scene[current_scene_idx], &p_raycast_data->rays[p_idx], &args);
486
}
487
488
void RaycastOcclusionCull::Scenario::raycast(CameraRayTile *r_rays, const uint32_t *p_valid_masks, uint32_t p_tile_count) const {
489
ERR_FAIL_NULL(singleton);
490
if (raycast_singleton->ebr_device == nullptr) {
491
return; // Embree is initialized on demand when there is some scenario with occluders in it.
492
}
493
494
if (ebr_scene[current_scene_idx] == nullptr) {
495
return;
496
}
497
498
RaycastThreadData td;
499
td.rays = r_rays;
500
td.masks = p_valid_masks;
501
502
WorkerThreadPool::GroupID group_task = WorkerThreadPool::get_singleton()->add_template_group_task(this, &Scenario::_raycast, &td, p_tile_count, -1, true, SNAME("RaycastOcclusionCullRaycast"));
503
WorkerThreadPool::get_singleton()->wait_for_group_task_completion(group_task);
504
}
505
506
////////////////////////////////////////////////////////
507
508
void RaycastOcclusionCull::add_buffer(RID p_buffer) {
509
ERR_FAIL_COND(buffers.has(p_buffer));
510
buffers[p_buffer] = RaycastHZBuffer();
511
}
512
513
void RaycastOcclusionCull::remove_buffer(RID p_buffer) {
514
ERR_FAIL_COND(!buffers.has(p_buffer));
515
buffers.erase(p_buffer);
516
}
517
518
void RaycastOcclusionCull::buffer_set_scenario(RID p_buffer, RID p_scenario) {
519
ERR_FAIL_COND(!buffers.has(p_buffer));
520
ERR_FAIL_COND(p_scenario.is_valid() && !scenarios.has(p_scenario));
521
buffers[p_buffer].scenario_rid = p_scenario;
522
}
523
524
void RaycastOcclusionCull::buffer_set_size(RID p_buffer, const Vector2i &p_size) {
525
ERR_FAIL_COND(!buffers.has(p_buffer));
526
buffers[p_buffer].resize(p_size);
527
}
528
529
Vector2 RaycastOcclusionCull::_get_jitter(const Rect2 &p_viewport_rect, const Size2i &p_buffer_size) {
530
if (!_jitter_enabled) {
531
return Vector2();
532
}
533
534
// Prevent divide by zero when using NULL viewport.
535
if ((p_buffer_size.x <= 0) || (p_buffer_size.y <= 0)) {
536
return Vector2();
537
}
538
539
int32_t frame = Engine::get_singleton()->get_frames_drawn();
540
frame %= 9;
541
542
Vector2 jitter;
543
544
switch (frame) {
545
default:
546
break;
547
case 1: {
548
jitter = Vector2(-1, -1);
549
} break;
550
case 2: {
551
jitter = Vector2(1, -1);
552
} break;
553
case 3: {
554
jitter = Vector2(-1, 1);
555
} break;
556
case 4: {
557
jitter = Vector2(1, 1);
558
} break;
559
case 5: {
560
jitter = Vector2(-0.5f, -0.5f);
561
} break;
562
case 6: {
563
jitter = Vector2(0.5f, -0.5f);
564
} break;
565
case 7: {
566
jitter = Vector2(-0.5f, 0.5f);
567
} break;
568
case 8: {
569
jitter = Vector2(0.5f, 0.5f);
570
} break;
571
}
572
Vector2 half_extents = p_viewport_rect.get_size() * 0.5;
573
jitter *= Vector2(half_extents.x / (float)p_buffer_size.x, half_extents.y / (float)p_buffer_size.y);
574
575
// The multiplier here determines the jitter magnitude in pixels.
576
// It seems like a value of 0.66 matches well the above jittering pattern as it generates subpixel samples at 0, 1/3 and 2/3
577
// Higher magnitude gives fewer false hidden, but more false shown.
578
// False hidden is obvious to viewer, false shown is not.
579
// False shown can lower percentage that are occluded, and therefore performance.
580
jitter *= 0.66f;
581
582
return jitter;
583
}
584
585
Rect2 _get_viewport_rect(const Projection &p_cam_projection) {
586
// NOTE: This assumes a rectangular projection plane, i.e. that:
587
// - the matrix is a projection across z-axis (i.e. is invertible and columns[0][1], [0][3], [1][0] and [1][3] == 0)
588
// - the projection plane is rectangular (i.e. columns[0][2] and [1][2] == 0 if columns[2][3] != 0)
589
Size2 half_extents = p_cam_projection.get_viewport_half_extents();
590
Point2 bottom_left = -half_extents * Vector2(p_cam_projection.columns[3][0] * p_cam_projection.columns[3][3] + p_cam_projection.columns[2][0] * p_cam_projection.columns[2][3] + 1, p_cam_projection.columns[3][1] * p_cam_projection.columns[3][3] + p_cam_projection.columns[2][1] * p_cam_projection.columns[2][3] + 1);
591
return Rect2(bottom_left, 2 * half_extents);
592
}
593
594
void RaycastOcclusionCull::buffer_update(RID p_buffer, const Transform3D &p_cam_transform, const Projection &p_cam_projection, bool p_cam_orthogonal) {
595
if (!buffers.has(p_buffer)) {
596
return;
597
}
598
599
RaycastHZBuffer &buffer = buffers[p_buffer];
600
601
if (buffer.is_empty() || !scenarios.has(buffer.scenario_rid)) {
602
return;
603
}
604
605
Scenario &scenario = scenarios[buffer.scenario_rid];
606
scenario.update();
607
608
Rect2 vp_rect = _get_viewport_rect(p_cam_projection);
609
Vector2 bottom_left = vp_rect.position;
610
bottom_left += _get_jitter(vp_rect, buffer.get_occlusion_buffer_size());
611
Vector3 near_bottom_left = Vector3(bottom_left.x, bottom_left.y, -p_cam_projection.get_z_near());
612
613
buffer.update_camera_rays(p_cam_transform, near_bottom_left, vp_rect.get_size(), p_cam_projection.get_z_far(), p_cam_orthogonal);
614
615
scenario.raycast(buffer.camera_rays, buffer.camera_ray_masks.ptr(), buffer.camera_rays_tile_count);
616
buffer.sort_rays(-p_cam_transform.basis.get_column(2), p_cam_orthogonal);
617
buffer.update_mips();
618
}
619
620
RaycastOcclusionCull::HZBuffer *RaycastOcclusionCull::buffer_get_ptr(RID p_buffer) {
621
if (!buffers.has(p_buffer)) {
622
return nullptr;
623
}
624
return &buffers[p_buffer];
625
}
626
627
RID RaycastOcclusionCull::buffer_get_debug_texture(RID p_buffer) {
628
ERR_FAIL_COND_V(!buffers.has(p_buffer), RID());
629
return buffers[p_buffer].get_debug_texture();
630
}
631
632
////////////////////////////////////////////////////////
633
634
void RaycastOcclusionCull::set_build_quality(RS::ViewportOcclusionCullingBuildQuality p_quality) {
635
if (build_quality == p_quality) {
636
return;
637
}
638
639
build_quality = p_quality;
640
641
for (KeyValue<RID, Scenario> &K : scenarios) {
642
K.value.dirty = true;
643
}
644
}
645
646
void RaycastOcclusionCull::_init_embree() {
647
#ifdef __SSE2__
648
_MM_SET_FLUSH_ZERO_MODE(_MM_FLUSH_ZERO_ON);
649
_MM_SET_DENORMALS_ZERO_MODE(_MM_DENORMALS_ZERO_ON);
650
#endif
651
652
String settings = vformat("threads=%d", MAX(1, OS::get_singleton()->get_processor_count() - 2));
653
ebr_device = rtcNewDevice(settings.utf8().ptr());
654
}
655
656
RaycastOcclusionCull::RaycastOcclusionCull() {
657
raycast_singleton = this;
658
int default_quality = GLOBAL_GET("rendering/occlusion_culling/bvh_build_quality");
659
_jitter_enabled = GLOBAL_GET("rendering/occlusion_culling/jitter_projection");
660
build_quality = RS::ViewportOcclusionCullingBuildQuality(default_quality);
661
}
662
663
RaycastOcclusionCull::~RaycastOcclusionCull() {
664
for (KeyValue<RID, Scenario> &K : scenarios) {
665
K.value.free();
666
}
667
668
if (ebr_device != nullptr) {
669
rtcReleaseDevice(ebr_device);
670
}
671
672
raycast_singleton = nullptr;
673
}
674
675