-
Notifications
You must be signed in to change notification settings - Fork 1
/
main.c
1042 lines (922 loc) · 28.1 KB
/
main.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
#include <assert.h>
#include <float.h>
#include <stdbool.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <errno.h>
#include <unistd.h>
#include <math.h>
#include "misc/vec2.h"
#include "misc/color.h"
#include "misc/debug.h"
#include "misc/file.h"
#include "misc/rng.h"
#include "misc/terminal.h"
#include "misc/time.h"
#include "misc/util.h"
// simulation size
enum {
X = 100,
Y = 40
};
// display size
int g_wx;
int g_wy;
enum {
// P-cells are the outermost cell type, though the boundary
// cells are always fluid sinks.
P_X = X,
P_Y = Y,
// U-cell samples lie between horizontal pairs of P-cells,
// so there's one fewer U-cell sample in X direction.
U_X = X-1,
U_Y = Y,
// V-cell samples lie between vertical pairs of P-cells,
// so there's one fewer V-cell sample in the Y direction.
V_X = X,
V_Y = Y-1
};
typedef enum celltype_t {
P,
U,
V
} celltype_t;
typedef struct args_t {
const char* scenario_file;
bool rainbow;
} args_t;
// simulation constants
const float k_side_length = 1.f; // grid cell size (m)
const float k_density = 1.f; // density in 2D (kg/m²)
const float k_gravity = -10.f; // acceleration (m/s²)
// All arrays are the same size so functions like bilinear interpolation can
// work on any array. The real size is smaller and is listed in the comments.
float g_u[Y][X]; // [Y][X-1] aka [U_Y][U_X]
float g_v[Y][X]; // [Y-1][X] aka [V_Y][V_X]
float g_utmp[Y][X]; // [Y][X-1] aka [U_Y][U_X]
float g_vtmp[Y][X]; // [Y-1][X] aka [V_Y][V_X]
// grid cell properties from the scenario file
// uint8_t used as a compact bool
uint8_t g_solid[Y][X];
uint8_t g_source[Y][X];
uint8_t g_sink[Y][X];
// color data
bool g_rainbow_enabled;
float g_r[Y][X];
float g_g[Y][X];
float g_b[Y][X];
float g_rtmp[Y][X];
float g_gtmp[Y][X];
float g_btmp[Y][X];
const float k_source_color_period = 10.f; // seconds
const float k_initial_color_period = 60.f; // grid cells
// simulation progress
bool g_pause;
uint32_t g_temp_unpause_counter;
uint16_t g_frame_count;
// marker particle data
#define MAX_MARKER_COUNT (4*Y*X)
size_t g_markers_length;
bool g_source_exhausted;
vec2f g_markers[MAX_MARKER_COUNT];
uint8_t g_marker_count[Y][X];
uint8_t g_prev_marker_count[Y][X];
// alternate names
#define g_fluid g_marker_count
#define g_prev_fluid g_prev_marker_count
void refresh_marker_counts() {
memcpy(g_prev_marker_count, g_marker_count, sizeof(g_marker_count));
memset(g_marker_count, 0, sizeof(g_marker_count));
for (size_t i = 0; i < g_markers_length; ++i) {
int x = (int)floorf(g_markers[i].x / k_side_length);
int y = (int)floorf(g_markers[i].y / k_side_length);
assert(x > 0 && x < (int)X && y > 0 && y < (int)Y);
if (g_sink[y][x] || g_solid[y][x]) {
// todo: stop moving markers into solid objects
// remove marker by swapping with back and resizing
g_markers[i--] = g_markers[--g_markers_length];
} else {
g_marker_count[y][x]++;
}
}
}
bool p_property(uint8_t p_value[Y][X], vec2i pidx) {
assert(pidx.x >= 0 && pidx.x < X && pidx.y >= 0 && pidx.y < Y);
return p_value[pidx.y][pidx.x] != 0;
}
bool is_fluid(int y, int x) {
return p_property(g_fluid, v2i(x,y));
}
bool u_property(uint8_t p_value[Y][X], vec2i uidx) {
vec2i left = { uidx.x, uidx.y };
vec2i right = { uidx.x + 1, uidx.y };
return p_property(p_value, left) | p_property(p_value, right);
}
bool v_property(uint8_t p_value[Y][X], vec2i vidx) {
vec2i bottom = { vidx.x, vidx.y };
vec2i top = { vidx.x, vidx.y + 1 };
return p_property(p_value, bottom) | p_property(p_value, top);
}
bool property(uint8_t p_value[Y][X], vec2i idx, celltype_t type) {
switch (type) {
default: assert(false);
case P: return p_property(p_value, idx);
case U: return u_property(p_value, idx);
case V: return v_property(p_value, idx);
}
}
vec2i grid_size(celltype_t type) {
switch (type) {
default: assert(false);
case P: return v2i(P_X, P_Y);
case U: return v2i(U_X, U_Y);
case V: return v2i(V_X, V_Y);
}
}
float valid_neighbor_average(float q[Y][X], vec2i lower, vec2i upper, celltype_t type) {
float total = 0.f;
int count = 0;
for (int y = lower.y; y <= upper.y; ++y) {
for (int x = lower.x; x <= upper.x; ++x) {
if (property(g_prev_fluid, v2i(x,y), type)) {
total += q[y][x];
count++;
}
}
}
assert(count > 0);
return total / count;
}
void extrapolate(float q[Y][X], celltype_t type) {
vec2i size = grid_size(type);
for (int y = 0; y < size.y; ++y) {
for (int x = 0; x < size.x; ++x) {
vec2i i = { x, y };
if (!property(g_prev_fluid, i, type) && property(g_fluid, i, type)) {
vec2i lower = v2i(max_i(x-1, 0), max_i(y-1, 0));
vec2i upper = v2i(min_i(x+1, size.x-1), min_i(y+1, size.y-1));
q[y][x] = valid_neighbor_average(q, lower, upper, type);
}
}
}
}
void colorize() {
for (int y = 0; y < Y; ++y) {
for (int x = 0; x < X; ++x) {
if (p_property(g_fluid, v2i(x,y))) {
float t = 0.f;
if (!g_source[y][x]) {
t = (x + y) * 6.f / k_initial_color_period;
}
g_r[y][x] = hsv_basis(t + 2.f);
g_g[y][x] = hsv_basis(t);
g_b[y][x] = hsv_basis(t - 2.f);
}
}
}
}
float randf() {
static uint64_t rng_state = 0x9bd185c449534b91;
uint32_t x = xorshift64_32star(&rng_state);
return (float)(x / (double)UINT32_MAX);
}
void sim_init(args_t in) {
int length;
char* contents = load_file(in.scenario_file, &length);
if (!contents) {
fprintf(stderr, "Could not load %s!\n", in.scenario_file);
exit(1);
}
// parse the scenario file to init our fluid
int i = 0;
uint8_t fluid[Y][X] = {};
for (int y = Y-2; y > 0 && i < length; --y) {
int x;
for (x = 1; x < X-1 && i < length; ++x) {
char c = contents[i++];
if (c == '\n') {
break;
} else if (c == 'X') {
g_solid[y][x] = true;
} else if (c == '0') {
fluid[y][x] = true;
} else if (c == '?') {
fluid[y][x] = true;
g_source[y][x] = true;
} else if (c == '=') {
g_sink[y][x] = true;
}
}
// discard anything beyond the simulation width
if (x == X-1) {
while (i < length && contents[i++] != '\n');
}
}
release_file(contents);
// add sinks around the outside so we have fewer edge cases
for (int y = 0; y < Y; ++y) {
g_sink[y][0] = true;
g_sink[y][X-1] = true;
}
for (int x = 0; x < X; ++x) {
g_sink[0][x] = true;
g_sink[Y-1][x] = true;
}
// setup fluid markers, 4 per cell, jittered
size_t idx = 0;
for (int i = 0; i < X; ++i) {
for (int j = 0; j < Y; ++j) {
if (fluid[j][i]) {
for (int k = 0; k < 4; ++k) {
float x = i + (k < 2 ? 0 : 0.5f) + (randf()/2);
float y = j + (k % 2 ? 0 : 0.5f) + (randf()/2);
g_markers[idx++] = v2f_mulf(k_side_length, v2f(x,y));
}
}
}
}
g_markers_length = idx;
refresh_marker_counts();
// setup color
if (g_rainbow_enabled) {
colorize();
}
}
void update_fluid_sources() {
// If we ever hit the max number of markers, that's it for adding fluid.
// The current extrapolation implementation assumes that the fluid is never
// more than one cell from a cell where fluid was in the previous step. If
// we stop and then later restart generating fluid, that may not hold true.
g_source_exhausted |= (g_markers_length == MAX_MARKER_COUNT-1);
float t = 0.6f / k_source_color_period * g_frame_count;
for (int y = 0; y < Y; ++y) {
for (int x = 0; x < X; ++x) {
if (g_source[y][x]) {
if (!g_source_exhausted && g_marker_count[y][x] < 4) {
g_markers[g_markers_length++] = v2f_mulf(k_side_length, v2f(x+randf(), y+randf()));
g_marker_count[y][x]++;
g_source_exhausted |= (g_markers_length == MAX_MARKER_COUNT-1);
}
g_r[y][x] = hsv_basis(t + 2.f);
g_g[y][x] = hsv_basis(t);
g_b[y][x] = hsv_basis(t - 2.f);
}
}
}
}
// result unspecified if both start and end are invalid
float get_fraction(float fraction, bool start_valid, bool end_valid) {
if (!start_valid) {
return 1.f;
} else if (!end_valid) {
return 0.f;
} else {
return fraction;
}
}
float linear(float x0, float x1, float frac) {
return (1.f - frac)*x0 + frac*x1;
}
// This method of handling missing data in interpolation gives different
// results depending on whether you interpolated horizontally first or
// vertically first, which is not a good sign for correctness.
float bilinear(float q[2][2], vec2f frac, bool valid[2][2]) {
assert(valid[0][0] | valid[0][1] | valid[1][0] | valid[1][1]);
// one fraction may be wrong if all values on one side are invalid,
// but the resulting value will be ignored in the vertical interpolation
float left_frac = get_fraction(frac.y, valid[0][0], valid[1][0]);
float right_frac = get_fraction(frac.y, valid[0][1], valid[1][1]);
float left_value = linear(q[0][0], q[1][0], left_frac);
float right_value = linear(q[0][1], q[1][1], right_frac);
float horz_frac = get_fraction(frac.x, valid[0][0] | valid[1][0],
valid[0][1] | valid[1][1]);
return linear(left_value, right_value, horz_frac);
}
float sparse_get(float q[Y][X], vec2i idx, bool valid) {
return valid ? q[idx.y][idx.x] : 0.f;
}
float interpolate(float q[Y][X], vec2f idx, celltype_t type) {
vec2i size = grid_size(type);
idx.x = clampf(0, idx.x, nextafterf(size.x-1, 0));
idx.y = clampf(0, idx.y, nextafterf(size.y-1, 0));
vec2f whole;
vec2f frac = modf2f(idx, &whole);
vec2i base_idx = v2i_trunc(whole);
// using bilinear interpolation between the 4 surrounding points,
// excluding any points outside the fluid
bool valid[2][2] = {
{ property(g_fluid, base_idx, type),
property(g_fluid, right(base_idx), type) },
{ property(g_fluid, up(base_idx), type),
property(g_fluid, up(right(base_idx)), type) }
};
// todo: only use bilinear interpolation when all 4 points are valid
// use barycentric coordinates when only 3 points are valid
// use linear interpolation when only 2 points are valid
float qlocal[2][2] = {
{ sparse_get(q, base_idx, valid[0][0]),
sparse_get(q, right(base_idx), valid[0][1]) },
{ sparse_get(q, up(base_idx), valid[1][0]),
sparse_get(q, up(right(base_idx)), valid[1][1]) }
};
return bilinear(qlocal, frac, valid);
}
float interpolate_u(float u[Y][X], vec2f uidx) {
return interpolate(u, uidx, U);
}
float interpolate_v(float v[Y][X], vec2f vidx) {
return interpolate(v, vidx, V);
}
float interpolate_p(float q[Y][X], vec2f pidx) {
return interpolate(q, pidx, P);
}
vec2f vidx_from_u(vec2i uidx) {
return (vec2f){ uidx.x + 0.5f, uidx.y - 0.5f };
}
void advect_u(float u[Y][X], float v[Y][X], float dt, float out[Y][X]) {
for (int y = 0; y < U_Y; ++y) {
for (int x = 0; x < U_X; ++x) {
vec2i uidx = { x, y };
if (u_property(g_fluid, uidx)) {
// find the velocity at the sample point
float dx = u[y][x];
float dy = interpolate_v(v, vidx_from_u(uidx));
// extrapolate backwards through time to find
// where the fluid came from
vec2f prev = { x - dx*dt / k_side_length,
y - dy*dt / k_side_length };
// take the value from there and put it here
out[y][x] = interpolate_u(u, prev);
}
}
}
}
vec2f uidx_from_v(vec2i vidx) {
return (vec2f){ vidx.x - 0.5f, vidx.y + 0.5f };
}
void advect_v(float u[Y][X], float v[Y][X], float dt, float out[Y][X]) {
for (int y = 0; y < V_Y; ++y) {
for (int x = 0; x < V_X; ++x) {
vec2i vidx = { x, y };
if (v_property(g_fluid, vidx)) {
// find the velocity at the sample point
float dy = v[y][x];
float dx = interpolate_u(u, uidx_from_v(vidx));
// extrapolate backwards through time to find
// where the fluid came from
vec2f prev = { x - dx*dt / k_side_length,
y - dy*dt / k_side_length };
// take the value from there and put it here
out[y][x] = interpolate_v(v, prev);
}
}
}
}
void advect_p(float q[Y][X], float u[Y][X], float v[Y][X], float dt, float out[Y][X]) {
for (int y = 0; y < P_Y; ++y) {
for (int x = 0; x < P_X; ++x) {
vec2i pidx = { x, y };
if (p_property(g_fluid, pidx)) {
// the caller must ensure there is never fluid in a boundary cell
float dy = (v[y][x] + v[y-1][x]) / 2;
float dx = (u[y][x] + u[y][x-1]) / 2;
vec2f prev = { x - dx*dt / k_side_length,
y - dy*dt / k_side_length };
out[y][x] = interpolate_p(q, prev);
}
}
}
}
vec2f velocity_at(vec2f pos) {
vec2f uidx = { pos.x / k_side_length - 1.f,
pos.y / k_side_length - 0.5f };
vec2f vidx = { pos.x / k_side_length - 0.5f,
pos.y / k_side_length - 1.f };
// out-of-bounds is handled in interpolate
float x = interpolate_u(g_u, uidx);
float y = interpolate_v(g_v, vidx);
return v2f(x,y);
}
float time_to(float p0, float p1, float v) {
if (fabsf(v) > 0.f) {
return (p1 - p0) / v;
} else {
return FLT_MAX;
}
}
// Collision detection was developed ad-hoc, but I should probably read
// A Fast Voxel Traversal Algorithm for Ray Tracing (1987)
// Note: Unfortunately, my collision detection via time_to depends
// on (x/y)*y == x, which is only approximately true for
// floating-point. Thus, occasionally particles will enter solid cells.
void advect_markers(float dt) {
for (size_t i = 0; i < g_markers_length; ++i) {
vec2f p = g_markers[i];
vec2f v = velocity_at(p);
vec2f np;
int x_idx = (int)floorf(p.x / k_side_length);
int y_idx = (int)floorf(p.y / k_side_length);
// next horizontal intersect
int x_dir = v.x > 0 ? 1 : -1;
int nx_idx = x_idx + (v.x > 0 ? 1 : 0);
np.x = nx_idx*k_side_length;
float t_x = time_to(p.x, np.x, v.x);
// at idx = x, we're on the boundary between x-1 and x
// if we're going left, the pressure cell we care about is x-1
// if we're going right, the pressure cell we care about is x
int x_idx_offset = v.x < 0 ? -1 : 0;
// next vertical intersect
int y_dir = v.y > 0 ? 1 : -1;
int ny_idx = y_idx + (v.y > 0 ? 1 : 0);
np.y = ny_idx*k_side_length;
float t_y = time_to(p.y, np.y, v.y);
// at idx = y, we're on the boundary between y-1 and y
// if we're going down, the pressure cell we care about is y-1
// if we're going up, the pressure cell we care about is y
int y_idx_offset = v.y < 0 ? -1 : 0;
float t_prev = 0.f;
float t_near = fminf(t_x, t_y);
while (t_near < dt) {
if (t_x < t_y) {
// entered new horizontal cell
if (g_solid[y_idx][nx_idx + x_idx_offset]) {
// hit! we're done going horizontal
p = v2f_add(p, v2f_mulf(t_prev, v));
dt -= t_prev;
t_near = 0;
v.x = 0.f;
t_x = FLT_MAX;
t_y = time_to(p.y, np.y, v.y);
} else {
// calculate next intersection
x_idx = nx_idx;
nx_idx = x_idx + x_dir;
np.x = nx_idx*k_side_length;
t_x = time_to(p.x, np.x, v.x);
}
} else {
// entered new vertical cell
if (g_solid[ny_idx + y_idx_offset][x_idx]) {
// hit! we're done going vertical
p = v2f_add(p, v2f_mulf(t_prev, v));
dt -= t_prev;
t_near = 0;
v.y = 0.f;
t_y = FLT_MAX;
t_x = time_to(p.x, np.x, v.x);
} else {
// calculate next intersection
y_idx = ny_idx;
ny_idx = y_idx + y_dir;
np.y = ny_idx*k_side_length;
t_y = time_to(p.y, np.y, v.y);
}
}
t_prev = t_near;
t_near = fminf(t_x, t_y);
}
float t = (t_near < FLT_MAX) ? dt : t_prev;
g_markers[i] = v2f_add(p, v2f_mulf(t, v));
}
}
void apply_body_forces(float v[Y][X], float dt) {
for (int y = 0; y < V_Y; ++y) {
for (int x = 0; x < V_X; ++x) {
v[y][x] += k_gravity * dt;
}
}
}
// pressure matrix
typedef struct sparse_entry_t {
int8_t a_diag;
} sparse_entry_t;
sparse_entry_t g_a[Y][X];
int8_t nonsolid_neighbor_count(int y, int x) {
// this function is only used on fluid cells, and the edge cells
// should never be fluid, so no bounds checks required
return 4 - g_solid[y][x-1] - g_solid[y][x+1]
- g_solid[y-1][x] - g_solid[y+1][x];
}
int8_t get_a_plus_i(int y, int x) {
return is_fluid(y,x+1) ? -1 : 0;
}
int8_t get_a_plus_j(int y, int x) {
return is_fluid(y+1,x) ? -1 : 0;
}
int8_t get_a_minus_i(int y, int x) {
return get_a_plus_i(y, x-1);
}
int8_t get_a_minus_j(int y, int x) {
return get_a_plus_j(y-1, x);
}
double g_precon[Y][X];
double g_q[Y][X];
void apply_preconditioner(double r[Y][X], double z[Y][X]) {
// Incomplete Cholesky
// A ~= LLᵀ
// L = F * E_inv + E
// calculate E_inv (precon)
for (int y = 0; y < Y; ++y) {
for (int x = 0; x < X; ++x) {
if (is_fluid(y, x)) {
double a = g_a[y][x].a_diag;
double b = sq(get_a_minus_i(y,x) * g_precon[y][x-1]);
double c = sq(get_a_minus_j(y,x) * g_precon[y-1][x]);
double e = a - b - c;
if (e < 0.25*a) {
e = a != 0 ? a : 1;
}
g_precon[y][x] = 1 / sqrt(e);
}
}
}
// solve Lq = r
memset(g_q, 0, sizeof(double)*Y*X);
for (int y = 0; y < Y; ++y) {
for (int x = 0; x < X; ++x) {
if (is_fluid(y, x)) {
double t = r[y][x]
- get_a_plus_i(y,x-1) * g_precon[y][x-1] * g_q[y][x-1]
- get_a_plus_j(y-1,x) * g_precon[y-1][x] * g_q[y-1][x];
g_q[y][x] = t * g_precon[y][x];
}
}
}
// solve Lᵀz = q
memset(z, 0, sizeof(double)*Y*X);
for (int y = Y; y--;) {
for (int x = X; x--;) {
if (is_fluid(y, x)) {
double t = g_q[y][x]
- get_a_plus_i(y,x) * g_precon[y][x] * z[y][x+1]
- get_a_plus_j(y,x) * g_precon[y][x] * z[y+1][x];
z[y][x] = t * g_precon[y][x];
}
}
}
}
double dot(double a[Y][X], double b[Y][X]) {
double total = 0.f;
for (int y = 0; y < Y; ++y) {
for (int x = 0; x < X; ++x) {
if (is_fluid(y, x)) {
total += a[y][x] * b[y][x];
}
}
}
return total;
}
bool all_zero(double r[Y][X]) {
for (int y = 0; y < Y; ++y) {
for (int x = 0; x < X; ++x) {
if (is_fluid(y, x)) {
if (r[y][x] != 0.f) {
return false;
}
}
}
}
return true;
}
double inf_norm(double r[Y][X]) {
double maximum = 0.f;
for (int y = 0; y < Y; ++y) {
for (int x = 0; x < X; ++x) {
if (is_fluid(y, x)) {
double a = fabs(r[y][x]);
if (a > maximum) {
maximum = a;
}
}
}
}
return maximum;
}
void update_search(double s[Y][X], double z[Y][X], double beta) {
for (int y = 0; y < Y; ++y) {
for (int x = 0; x < X; ++x) {
if (is_fluid(y, x)) {
s[y][x] = z[y][x] + beta * s[y][x];
}
}
}
}
void apply_a(double s[Y][X], double out[Y][X]) {
for (int y = 0; y < Y; ++y) {
for (int x = 0; x < X; ++x) {
if (is_fluid(y, x)) {
out[y][x] = g_a[y][x].a_diag * s[y][x]
- (is_fluid(y,x+1) ? s[y][x+1] : 0)
- (is_fluid(y+1,x) ? s[y+1][x] : 0)
- (is_fluid(y,x-1) ? s[y][x-1] : 0)
- (is_fluid(y-1,x) ? s[y-1][x] : 0);
}
}
}
}
// c += a*b
void fmadd(double a[Y][X], double b, double c[Y][X]) {
for (int y = 0; y < Y; ++y) {
for (int x = 0; x < X; ++x) {
if (is_fluid(y, x)) {
c[y][x] += a[y][x] * b;
}
}
}
}
// Acceleration due to pressure: -grad(p) / density
float accel(float delta_p) {
return -invf(k_density * k_side_length) * delta_p;
}
void project(float dt, float u[Y][X], float v[Y][X], float uout[Y][X], float vout[Y][X]) {
// Using -div(u) = laplacian(p) * dt / density.
// Solve Ap = b, with A = laplacian * dx²,
// b = -div(u) * density * dx² / dt
const double k_inv_scale = sqf(k_side_length) * k_density / dt;
// calculate b
double b[Y][X] = {};
for (int y = 0; y < Y; ++y) {
for (int x = 0; x < X; ++x) {
if (is_fluid(y,x)) {
double divergence = (u[y][x] - u[y][x-1] + v[y][x] - v[y-1][x]) / k_side_length;
b[y][x] = -divergence * k_inv_scale;
}
}
}
// calculate A
for (int y = 0; y < Y; ++y) {
for (int x = 0; x < X; ++x) {
if (is_fluid(y, x)) {
g_a[y][x].a_diag = nonsolid_neighbor_count(y, x);
}
}
}
const int max_iterations = 100;
const double tol = 1e-6f;
// conjugate gradient
double p[Y][X] = {}; // pressure guess
double r[Y][X]; // residual
memcpy(r, b, sizeof(r));
if (!all_zero(r)) {
double z[Y][X]; // auxiliary vector
apply_preconditioner(r, z);
double s[Y][X]; // search vector
memcpy(s, z, sizeof(s));
double sigma = dot(z,r);
for (int i = 0; i < max_iterations; ++i) {
apply_a(s, z);
double alpha = sigma / dot(z,s);
fmadd(s, alpha, p); // p += alpha*s
fmadd(z, -alpha, r); // r -= alpha*z
if (inf_norm(r) <= tol) {
break;
}
apply_preconditioner(r, z);
double sigma_new = dot(z,r);
double beta = sigma_new / sigma;
update_search(s,z,beta);
sigma = sigma_new;
}
}
// clamp pressure to zero or greater
// This step is not in Bridson's notes, but it fixes some weird artifacts.
// Without it, the pressure solve sometimes introduced negative pressures
// to eliminate divergence at solid boundaries, causing extreme stickyness
for (int y = 0; y < Y; ++y) {
for (int x = 0; x < X; ++x) {
if (is_fluid(y,x) && p[y][x] < 0.f) {
p[y][x] = 0.f;
}
}
}
// update horizontal velocities
for (int y = 0; y < U_Y; ++y) {
for (int x = 0; x < U_X; ++x) {
if (u_property(g_solid, v2i(x,y))) {
uout[y][x] = 0.f;
} else if (u_property(g_fluid, v2i(x,y))) {
uout[y][x] = u[y][x] + accel(p[y][x+1] - p[y][x]) * dt;
} else { // air
uout[y][x] = 0.f;
}
}
}
// update vertical velocities
for (int y = 0; y < V_Y; ++y) {
for (int x = 0; x < V_X; ++x) {
if (v_property(g_solid, v2i(x,y))) {
vout[y][x] = 0.f;
} else if (v_property(g_fluid, v2i(x,y))) {
vout[y][x] = v[y][x] + accel(p[y+1][x] - p[y][x]) * dt;
} else { // air
vout[y][x] = 0.f;
}
}
}
}
float maxsq(float q[Y][X], celltype_t type) {
vec2i size = grid_size(type);
float max = 0;
for (int y = 0; y < size.y; ++y) {
for (int x = 0; x < size.x; ++x) {
float value = sqf(q[y][x]);
if (value > max) {
max = value;
}
}
}
return max;
}
void zero_bounds(float q[Y][X], celltype_t type) {
vec2i size = grid_size(type);
for (int y = 0; y < size.y; ++y) {
for (int x = 0; x < size.x; ++x) {
// not really necessary to zero air cells, but makes debugging easier
if (!property(g_fluid, v2i(x,y), type) || property(g_solid, v2i(x,y), type)) {
q[y][x] = 0.f;
}
}
}
}
float calculate_timestep(float frame_time) {
// Bridson suggests a limit of five cells, but my implementation
// of advection and extrapolation assume that new fluid cells are
// within one grid cell of old fluid cells.
const float max_distance = 0.75f * k_side_length;
float max_velocity = sqrtf(maxsq(g_u, U) + maxsq(g_v, V));
return fminf(max_distance / max_velocity, frame_time);
}
void sim_step() {
if (g_pause && g_temp_unpause_counter == 0) {
return;
}
// split frame timestep into sub-steps
const float total_frame_time = 0.1f;
float frame_time = total_frame_time;
for (int step = 0; frame_time > 0.f && step < 8; ++step) {
float dt = calculate_timestep(frame_time);
frame_time -= dt;
advect_markers(dt);
refresh_marker_counts();
// extrapolate values for new fluid cells from their neighbours
if (g_rainbow_enabled) {
extrapolate(g_r, P);
extrapolate(g_g, P);
extrapolate(g_b, P);
}
update_fluid_sources();
extrapolate(g_u, U);
extrapolate(g_v, V);
zero_bounds(g_u, U);
zero_bounds(g_v, V);
// advect fluid properties along the fluid flow
advect_u(g_u, g_v, dt, g_utmp);
advect_v(g_u, g_v, dt, g_vtmp);
if (g_rainbow_enabled) {
advect_p(g_r, g_u, g_v, dt, g_rtmp);
memcpy(g_r, g_rtmp, sizeof(g_r));
advect_p(g_g, g_u, g_v, dt, g_gtmp);
memcpy(g_g, g_gtmp, sizeof(g_g));
advect_p(g_b, g_u, g_v, dt, g_btmp);
memcpy(g_b, g_btmp, sizeof(g_b));
}
// add acceleration due to gravity
apply_body_forces(g_vtmp, dt);
// set velocities constrained by solid boundaries
zero_bounds(g_utmp, U);
zero_bounds(g_vtmp, V);
// project our approximate solution for the updated velocity field
// to the nearest divergence-free solution
project(dt, g_utmp, g_vtmp, g_u, g_v);
}
if (g_temp_unpause_counter) {
g_temp_unpause_counter--;
}
g_frame_count++;
}
void buffer_append_color(buffer_t* buf, float r, float g, float b) {
char tmp[20];
int r_out = float_to_byte_color(linear_to_sRGB(r));
int g_out = float_to_byte_color(linear_to_sRGB(g));
int b_out = float_to_byte_color(linear_to_sRGB(b));
int length = snprintf(tmp, sizeof(tmp), "\x1B[38;2;%d;%d;%dm", r_out, g_out, b_out);
if (length < 0 || length >= (int)sizeof(tmp)) {
die("failed to format color");
}
buffer_append(buf, tmp, length);
}
void draw_rows(buffer_t* buf) {
const char* symbol[4] = {" ","o","O","0"};
const uint8_t max_symbol_idx = 3;
const int y_cutoff = max_i((int)Y-1 - g_wy, 1);
for (int y = Y-1; y-- > y_cutoff;) {
bool prev_water = false;
for (int x = 1; x < (int)X-1 && x < g_wx+1; x++) {
if (g_solid[y][x]) {
if (prev_water) {
buffer_appendz(buf, T_RESET);
}
buffer_appendz(buf, "X");
prev_water = false;
} else if (g_sink[y][x]) {
if (prev_water) {
buffer_appendz(buf, T_RESET);
}
buffer_appendz(buf, "=");
} else {
uint8_t i = min_u8(g_marker_count[y][x], max_symbol_idx);
bool has_water = i > 0;
if (!prev_water && has_water && !g_rainbow_enabled) {
buffer_appendz(buf, T_BLUE);
} else if (has_water && g_rainbow_enabled) {
buffer_append_color(buf, g_r[y][x], g_g[y][x], g_b[y][x]);
} else if (prev_water && !has_water) {
buffer_appendz(buf, T_RESET);
}
buffer_appendz(buf, symbol[i]);
prev_water = has_water;
}
}
buffer_appendz(buf, T_RESET T_CLEAR_LINE);
if (y > y_cutoff) {
buffer_appendz(buf, "\r\n");
}
}
}
void draw(buffer_t* buf) {
buffer_clear(buf);
reposition_cursor(buf);
draw_rows(buf);
hide_cursor(buf);
buffer_write(buf);
}
bool process_keypress() {
char c = '\0';
if (read(STDIN_FILENO, &c, 1) == -1 && errno != EAGAIN && errno != EINTR) {
die("read");
}
if (c == 'p') {
g_pause = !g_pause;
} else if (c == 'f') {
g_temp_unpause_counter++;
} else if (c == 'r') {
if (g_rainbow_enabled) {
colorize();
}
} else if (c == 'q') {
clear_screen_now();
return false;
}
return true;
}
args_t parse_args(int argc, char** argv) {
args_t in;
in.rainbow = false;
if (argc < 2) {
fprintf(stderr, "usage: %s [--rainbow] <scenario>\n", argv[0]);
exit(1);
}
for (int i = 1; i < argc - 1; ++i) {
if (!strcmp(argv[i], "--rainbow")) {
in.rainbow = true;
} else {
fprintf(stderr, "Unrecognized input: %s\n", argv[i]);
exit(1);
}
}
in.scenario_file = argv[argc-1];