20#ifndef _TGX_SHADERS_H_
21#define _TGX_SHADERS_H_
36 return ((v < 0) ? 0 : ((v > maxv) ? maxv : v));
44 template<
typename color_t,
typename ZBUFFER_t>
45 void shader_test(
const int32_t& offset,
const int32_t& lx,
const int32_t& ly,
46 const int32_t& dx1,
const int32_t& dy1, int32_t O1,
const tgx::RasterizerVec4& fP1,
47 const int32_t& dx2,
const int32_t& dy2, int32_t O2,
const tgx::RasterizerVec4& fP2,
48 const int32_t& dx3,
const int32_t& dy3, int32_t O3,
const tgx::RasterizerVec4& fP3,
49 const tgx::RasterizerParams<color_t, color_t, ZBUFFER_t>& data)
52 color_t* buf = data.im->data() + offset;
53 const int32_t stride = data.im->stride();
54 for (
int y = 0; y < ly; y++)
56 for (
int x = 0; x < lx; x++)
58 const int32_t o1 = O1 + dx1 * x + dy1 * y;
59 const int32_t o2 = O2 + dx2 * x + dy2 * y;
60 const int32_t o3 = O3 + dx3 * x + dy3 * y;
61 if ((o1 >= 0) && (o2 >= 0) && (o3 >= 0))
63 buf[x + stride * y].
blend256(col, 128);
73 template<
typename color_t,
typename ZBUFFER_t>
74 void shader_Flat(
const int32_t& offset,
const int32_t& lx,
const int32_t& ly,
75 const int32_t& dx1,
const int32_t& dy1, int32_t O1,
const RasterizerVec4& fP1,
76 const int32_t& dx2,
const int32_t& dy2, int32_t O2,
const RasterizerVec4& fP2,
77 const int32_t& dx3,
const int32_t& dy3, int32_t O3,
const RasterizerVec4& fP3,
78 const RasterizerParams<color_t, color_t, ZBUFFER_t>& data)
80 color_t col = (color_t)data.facecolor;
81 color_t* buf = data.im->data() + offset;
82 const int32_t stride = data.im->stride();
84 const uintptr_t end = (uintptr_t)(buf + (ly * stride));
86 while ((uintptr_t)(buf) < end)
92 bx = (-O1 + dx1 - 1) / dx1;
99 const int32_t by = (-O2 + dy2 - 1) / dy2;
103 const int32_t offs = by * stride;
107 bx =
max(bx, ((-O2 + dx2 - 1) / dx2));
113 if (dy3 <= 0)
return;
114 const int32_t by = (-O3 + dy3 - 1) / dy3;
118 const int32_t offs = by * stride;
122 bx =
max(bx, ((-O3 + dx3 - 1) / dx3));
125 int32_t C2 = O2 + (dx2 * bx);
126 int32_t C3 = O3 + (dx3 * bx);
127 while ((bx < lx) && ((C2 | C3) >= 0))
148 template<
typename color_t,
typename ZBUFFER_t>
150 const int32_t& dx1,
const int32_t& dy1, int32_t O1,
const RasterizerVec4& fP1,
151 const int32_t& dx2,
const int32_t& dy2, int32_t O2,
const RasterizerVec4& fP2,
152 const int32_t& dx3,
const int32_t& dy3, int32_t O3,
const RasterizerVec4& fP3,
153 const RasterizerParams<color_t, color_t, ZBUFFER_t>& data)
155 color_t* buf = data.im->data() + offset;
156 const int32_t stride = data.im->stride();
158 const color_t col1 = (color_t)fP1.color;
159 const color_t col2 = (color_t)fP2.color;
160 const color_t col3 = (color_t)fP3.color;
162 const uintptr_t end = (uintptr_t)(buf + (ly * stride));
163 const int32_t pa = O1 + O2 + O3;
164 const int32_t E = ((pa == 0) ? 1 : 0);
165 const int32_t aera = pa + E;
166 const int shiftC = (aera > (1 << 22)) ? 10 : 0;
168 while ((uintptr_t)(buf) < end)
174 bx = (-O1 + dx1 - 1) / dx1;
180 if (dy2 <= 0)
return;
181 const int32_t by = (-O2 + dy2 - 1) / dy2;
185 const int32_t offs = by * stride;
189 bx =
max(bx, ((-O2 + dx2 - 1) / dx2));
195 if (dy3 <= 0)
return;
196 const int32_t by = (-O3 + dy3 - 1) / dy3;
200 const int32_t offs = by * stride;
204 bx =
max(bx, ((-O3 + dx3 - 1) / dx3));
207 int32_t C2 = O2 + (dx2 * bx);
208 int32_t C3 = O3 + (dx3 * bx);
209 while ((bx < lx) && ((C2 | C3) >= 0))
229 template<
typename color_t,
typename ZBUFFER_t,
bool TEXTURE_BILINEAR,
bool TEXTURE_WRAP>
231 const int32_t dx1,
const int32_t dy1, int32_t O1,
const RasterizerVec4& fP1,
232 const int32_t dx2,
const int32_t dy2, int32_t O2,
const RasterizerVec4& fP2,
233 const int32_t dx3,
const int32_t dy3, int32_t O3,
const RasterizerVec4& fP3,
234 const RasterizerParams<color_t, color_t, ZBUFFER_t>& data)
236 color_t* buf = data.im->data() + offset;
237 const int32_t stride = data.im->stride();
239 const uintptr_t end = (uintptr_t)(buf + (ly * stride));
240 const int32_t pa = O1 + O2 + O3;
241 const int32_t E = ((pa == 0) ? 1 : 0);
242 const int32_t aera = pa + E;
245 const float invaera =
fast_inv((
float)aera);
246 const float fP1a = fP1.w * invaera;
247 const float fP2a = fP2.w * invaera;
248 const float fP3a = fP3.w * invaera;
250 const float dw = (dx1 * fP1a) + (dx2 * fP2a) + (dx3 * fP3a);
252 const RGBf& cf = (
RGBf)data.facecolor;
253 const int fPR = (
int)(256 * cf.
R);
254 const int fPG = (int)(256 * cf.
G);
255 const int fPB = (int)(256 * cf.
B);
262 const color_t* tex = data.tex->data();
263 const int32_t texsize_x = data.tex->width();
264 const int32_t texsize_y = data.tex->height();
265 const int32_t texsize_x_mm = texsize_x - 1;
266 const int32_t texsize_y_mm = texsize_y - 1;
267 const int32_t texstride = data.tex->stride();
280 const float dtx = ((T1.
x * dx1) + (T2.
x * dx2) + (T3.
x * dx3));
281 const float dty = ((T1.
y * dx1) + (T2.
y * dx2) + (T3.
y * dx3));
283 while ((uintptr_t)(buf) < end)
289 bx = (-O1 + dx1 - 1) / dx1;
295 if (dy2 <= 0)
return;
296 const int32_t by = (-O2 + dy2 - 1) / dy2;
300 const int32_t offs = by * stride;
304 bx =
max(bx, ((-O2 + dx2 - 1) / dx2));
310 if (dy3 <= 0)
return;
311 const int32_t by = (-O3 + dy3 - 1) / dy3;
315 const int32_t offs = by * stride;
319 bx =
max(bx, ((-O3 + dx3 - 1) / dx3));
322 int32_t C1 = O1 + (dx1 * bx) + E;
323 int32_t C2 = O2 + (dx2 * bx);
324 int32_t C3 = O3 + (dx3 * bx);
325 float cw = ((C1 * fP1a) + (C2 * fP2a) + (C3 * fP3a));
327 float tx = ((T1.
x * C1) + (T2.
x * C2) + (T3.
x * C3));
328 float ty = ((T1.
y * C1) + (T2.
y * C2) + (T3.
y * C3));
330 while ((bx < lx) && ((C2 | C3) >= 0))
335 if (TEXTURE_BILINEAR)
337 const float xx = tx * icw;
338 const float yy = ty * icw;
339 const int ttx = (int)floorf(xx);
340 const int tty = (int)floorf(yy);
341 const float ax = xx - ttx;
342 const float ay = yy - tty;
343 const int minx = (TEXTURE_WRAP ? (ttx & (texsize_x_mm)) :
shaderclip(ttx, texsize_x_mm));
344 const int maxx = (TEXTURE_WRAP ? ((ttx + 1) & (texsize_x_mm)) :
shaderclip(ttx + 1, texsize_x_mm));
345 const int miny = (TEXTURE_WRAP ? ((tty & (texsize_y_mm))*texstride) :
shaderclip(tty, texsize_y_mm) * texstride);
346 const int maxy = (TEXTURE_WRAP ? (((tty + 1) & (texsize_y_mm))*texstride) :
shaderclip(tty + 1, texsize_y_mm) * texstride);
351 const int ttx = (TEXTURE_WRAP ? ((int)((tx * icw))) & (texsize_x_mm) :
shaderclip((
int)(tx * icw), texsize_x_mm));
352 const int tty = (TEXTURE_WRAP ? ((int)((ty * icw))) & (texsize_y_mm) :
shaderclip((
int)(ty * icw), texsize_y_mm));
353 col = tex[ttx + (tty)*texstride];
356 col.mult256(fPR, fPG, fPB);
381 template<
typename color_t,
typename ZBUFFER_t,
bool TEXTURE_BILINEAR,
bool TEXTURE_WRAP>
383 const int32_t dx1,
const int32_t dy1, int32_t O1,
const RasterizerVec4& fP1,
384 const int32_t dx2,
const int32_t dy2, int32_t O2,
const RasterizerVec4& fP2,
385 const int32_t dx3,
const int32_t dy3, int32_t O3,
const RasterizerVec4& fP3,
386 const RasterizerParams<color_t, color_t, ZBUFFER_t>& data)
389 color_t* buf = data.im->data() + offset;
390 const int32_t stride = data.im->stride();
392 const uintptr_t end = (uintptr_t)(buf + (ly * stride));
393 const int32_t pa = O1 + O2 + O3;
394 const int32_t E = ((pa == 0) ? 1 : 0);
395 const int32_t aera = pa + E;
397 const float invaera =
fast_inv((
float)aera);
398 const float fP1a = fP1.w * invaera;
399 const float fP2a = fP2.w * invaera;
400 const float fP3a = fP3.w * invaera;
402 const float dw = (dx1 * fP1a) + (dx2 * fP2a) + (dx3 * fP3a);
407 const int fP1R = (
int)(256 * cf1.
R);
408 const int fP1G = (int)(256 * cf1.
G);
409 const int fP1B = (int)(256 * cf1.
B);
410 const int fP21R = (int)(256 * (cf2.R - cf1.
R));
411 const int fP21G = (int)(256 * (cf2.G - cf1.
G));
412 const int fP21B = (int)(256 * (cf2.B - cf1.
B));
413 const int fP31R = (int)(256 * (cf3.
R - cf1.
R));
414 const int fP31G = (int)(256 * (cf3.
G - cf1.
G));
415 const int fP31B = (int)(256 * (cf3.
B - cf1.
B));
422 const color_t* tex = data.tex->data();
423 const int32_t texsize_x = data.tex->width();
424 const int32_t texsize_y = data.tex->height();
425 const int32_t texsize_x_mm = texsize_x - 1;
426 const int32_t texsize_y_mm = texsize_y - 1;
427 const int32_t texstride = data.tex->stride();
441 const float dtx = ((T1.
x * dx1) + (T2.
x * dx2) + (T3.
x * dx3));
442 const float dty = ((T1.
y * dx1) + (T2.
y * dx2) + (T3.
y * dx3));
444 while ((uintptr_t)(buf) < end)
450 bx = (-O1 + dx1 - 1) / dx1;
456 if (dy2 <= 0)
return;
457 const int32_t by = (-O2 + dy2 - 1) / dy2;
461 const int32_t offs = by * stride;
465 bx =
max(bx, ((-O2 + dx2 - 1) / dx2));
471 if (dy3 <= 0)
return;
472 const int32_t by = (-O3 + dy3 - 1) / dy3;
476 const int32_t offs = by * stride;
480 bx =
max(bx, ((-O3 + dx3 - 1) / dx3));
483 int32_t C1 = O1 + (dx1 * bx) + E;
484 int32_t C2 = O2 + (dx2 * bx);
485 int32_t C3 = O3 + (dx3 * bx);
486 float cw = ((C1 * fP1a) + (C2 * fP2a) + (C3 * fP3a));
488 float tx = ((T1.
x * C1) + (T2.
x * C2) + (T3.
x * C3));
489 float ty = ((T1.
y * C1) + (T2.
y * C2) + (T3.
y * C3));
491 while ((bx < lx) && ((C2 | C3) >= 0))
496 if (TEXTURE_BILINEAR)
498 const float xx = tx * icw;
499 const float yy = ty * icw;
500 const int ttx = (int)floorf(xx);
501 const int tty = (int)floorf(yy);
502 const float ax = xx - ttx;
503 const float ay = yy - tty;
504 const int minx = (TEXTURE_WRAP ? (ttx & (texsize_x_mm)) :
shaderclip(ttx, texsize_x_mm));
505 const int maxx = (TEXTURE_WRAP ? ((ttx + 1) & (texsize_x_mm)) :
shaderclip(ttx + 1, texsize_x_mm));
506 const int miny = (TEXTURE_WRAP ? ((tty & (texsize_y_mm)) * texstride) :
shaderclip(tty, texsize_y_mm) * texstride);
507 const int maxy = (TEXTURE_WRAP ? (((tty + 1) & (texsize_y_mm)) * texstride) :
shaderclip(tty + 1, texsize_y_mm) * texstride);
512 const int ttx = (TEXTURE_WRAP ? ((int)((tx * icw))) & (texsize_x_mm) :
shaderclip((
int)(tx * icw), texsize_x_mm));
513 const int tty = (TEXTURE_WRAP ? ((int)((ty * icw))) & (texsize_y_mm) :
shaderclip((
int)(ty * icw), texsize_y_mm));
514 col = tex[ttx + (tty)*texstride];
517 const int r = fP1R + ((C2 * fP21R + C3 * fP31R) / aera);
518 const int g = fP1G + ((C2 * fP21G + C3 * fP31G) / aera);
519 const int b = fP1B + ((C2 * fP21B + C3 * fP31B) / aera);
521 col.mult256(r, g, b);
546 template<
typename color_t,
typename ZBUFFER_t>
548 const int32_t& dx1,
const int32_t& dy1, int32_t O1,
const RasterizerVec4& fP1,
549 const int32_t& dx2,
const int32_t& dy2, int32_t O2,
const RasterizerVec4& fP2,
550 const int32_t& dx3,
const int32_t& dy3, int32_t O3,
const RasterizerVec4& fP3,
551 const RasterizerParams<color_t, color_t, ZBUFFER_t>& data)
553 const color_t col = (color_t)data.facecolor;
554 color_t* buf = data.im->data() + offset;
555 ZBUFFER_t * zbuf = data.zbuf + offset;
557 const int32_t stride = data.im->stride();
558 const int32_t zstride = data.im->lx();
560 const uintptr_t end = (uintptr_t)(buf + (ly * stride));
561 const int32_t pa = O1 + O2 + O3;
562 const int32_t E = ((pa == 0) ? 1 : 0);
563 const int32_t aera = pa + E;
565 const float wa = data.wa;
566 const float wb = data.wb;
567 const float invaera =
fast_inv((
float)aera);
568 const float invaera_wa = invaera * wa;
569 const float fP1a = fP1.w * invaera_wa;
570 const float fP2a = fP2.w * invaera_wa;
571 const float fP3a = fP3.w * invaera_wa;
572 const float dw = (dx1 * fP1a) + (dx2 * fP2a) + (dx3 * fP3a);
574 while ((uintptr_t)(buf) < end)
580 bx = (-O1 + dx1 - 1) / dx1;
586 if (dy2 <= 0)
return;
587 const int32_t by = (-O2 + dy2 - 1) / dy2;
591 const int32_t offs = by * stride;
596 bx =
max(bx, ((-O2 + dx2 - 1) / dx2));
602 if (dy3 <= 0)
return;
603 const int32_t by = (-O3 + dy3 - 1) / dy3;
607 const int32_t offs = by * stride;
612 bx =
max(bx, ((-O3 + dx3 - 1) / dx3));
615 const int32_t C1 = O1 + (dx1 * bx) + E;
616 int32_t C2 = O2 + (dx2 * bx);
617 int32_t C3 = O3 + (dx3 * bx);
618 float cw = ((C1 * fP1a) + (C2 * fP2a) + (C3 * fP3a)) + wb;
620 while ((bx < lx) && ((C2 | C3) >= 0))
622 ZBUFFER_t& W = zbuf[bx];
623 const ZBUFFER_t aa = (ZBUFFER_t)(cw);
648 template<
typename color_t,
typename ZBUFFER_t>
650 const int32_t dx1,
const int32_t dy1, int32_t O1,
const RasterizerVec4& fP1,
651 const int32_t dx2,
const int32_t dy2, int32_t O2,
const RasterizerVec4& fP2,
652 const int32_t dx3,
const int32_t dy3, int32_t O3,
const RasterizerVec4& fP3,
653 const RasterizerParams<color_t, color_t, ZBUFFER_t>& data)
655 color_t* buf = data.im->data() + offset;
656 ZBUFFER_t* zbuf = data.zbuf + offset;
659 const int32_t stride = data.im->stride();
660 const int32_t zstride = data.im->lx();
662 const color_t col1 = (color_t)fP1.color;
663 const color_t col2 = (color_t)fP2.color;
664 const color_t col3 = (color_t)fP3.color;
666 const uintptr_t end = (uintptr_t)(buf + (ly * stride));
667 const int32_t pa = O1 + O2 + O3;
668 const int32_t E = ((pa == 0) ? 1 : 0);
669 const int32_t aera = pa + E;
670 const int shiftC = (aera > (1 << 22)) ? 10 : 0;
672 const float wa = data.wa;
673 const float wb = data.wb;
674 const float invaera =
fast_inv((
float)aera);
675 const float invaera_wa = invaera * wa;
676 const float fP1a = fP1.w * invaera_wa;
677 const float fP2a = fP2.w * invaera_wa;
678 const float fP3a = fP3.w * invaera_wa;
679 const float dw = (dx1 * fP1a) + (dx2 * fP2a) + (dx3 * fP3a);
681 while ((uintptr_t)(buf) < end)
687 bx = (-O1 + dx1 - 1) / dx1;
693 if (dy2 <= 0)
return;
694 const int32_t by = (-O2 + dy2 - 1) / dy2;
698 const int32_t offs = by * stride;
703 bx =
max(bx, ((-O2 + dx2 - 1) / dx2));
709 if (dy3 <= 0)
return;
710 const int32_t by = (-O3 + dy3 - 1) / dy3;
714 const int32_t offs = by * stride;
719 bx =
max(bx, ((-O3 + dx3 - 1) / dx3));
722 const int32_t C1 = O1 + (dx1 * bx) + E;
723 int32_t C2 = O2 + (dx2 * bx);
724 int32_t C3 = O3 + (dx3 * bx);
725 float cw = ((C1 * fP1a) + (C2 * fP2a) + (C3 * fP3a)) + wb;
727 while ((bx < lx) && ((C2 | C3) >= 0))
729 ZBUFFER_t& W = zbuf[bx];
730 const ZBUFFER_t aa = (ZBUFFER_t)(cw);
754 template<
typename color_t,
typename ZBUFFER_t,
bool TEXTURE_BILINEAR,
bool TEXTURE_WRAP>
756 const int32_t dx1,
const int32_t dy1, int32_t O1,
const RasterizerVec4& fP1,
757 const int32_t dx2,
const int32_t dy2, int32_t O2,
const RasterizerVec4& fP2,
758 const int32_t dx3,
const int32_t dy3, int32_t O3,
const RasterizerVec4& fP3,
759 const RasterizerParams<color_t, color_t, ZBUFFER_t>& data)
761 color_t* buf = data.im->data() + offset;
762 ZBUFFER_t* zbuf = data.zbuf + offset;
764 const float wa = data.wa;
765 const float wb = data.wb;
770 const int32_t stride = data.im->stride();
771 const int32_t zstride = data.im->lx();
773 const uintptr_t end = (uintptr_t)(buf + (ly * stride));
774 const int32_t pa = O1 + O2 + O3;
775 const int32_t E = ((pa == 0) ? 1 : 0);
776 const int32_t aera = pa + E;
778 const float invaera =
fast_inv((
float)aera);
779 const float fP1a = fP1.w * invaera;
780 const float fP2a = fP2.w * invaera;
781 const float fP3a = fP3.w * invaera;
783 const float dw = (dx1 * fP1a) + (dx2 * fP2a) + (dx3 * fP3a);
785 const RGBf& cf = (
RGBf)data.facecolor;
786 const int fPR = (
int)(256 * cf.
R);
787 const int fPG = (int)(256 * cf.
G);
788 const int fPB = (int)(256 * cf.
B);
795 const color_t* tex = data.tex->data();
796 const int32_t texsize_x = data.tex->width();
797 const int32_t texsize_y = data.tex->height();
798 const int32_t texsize_x_mm = texsize_x - 1;
799 const int32_t texsize_y_mm = texsize_y - 1;
800 const int32_t texstride = data.tex->stride();
813 const float dtx = ((T1.
x * dx1) + (T2.
x * dx2) + (T3.
x * dx3));
814 const float dty = ((T1.
y * dx1) + (T2.
y * dx2) + (T3.
y * dx3));
816 while ((uintptr_t)(buf) < end)
822 bx = (-O1 + dx1 - 1) / dx1;
828 if (dy2 <= 0)
return;
829 const int32_t by = (-O2 + dy2 - 1) / dy2;
833 const int32_t offs = by * stride;
838 bx =
max(bx, ((-O2 + dx2 - 1) / dx2));
844 if (dy3 <= 0)
return;
845 const int32_t by = (-O3 + dy3 - 1) / dy3;
849 const int32_t offs = by * stride;
854 bx =
max(bx, ((-O3 + dx3 - 1) / dx3));
857 int32_t C1 = O1 + (dx1 * bx) + E;
858 int32_t C2 = O2 + (dx2 * bx);
859 int32_t C3 = O3 + (dx3 * bx);
860 float cw = ((C1 * fP1a) + (C2 * fP2a) + (C3 * fP3a));
862 float tx = ((T1.
x * C1) + (T2.
x * C2) + (T3.
x * C3));
863 float ty = ((T1.
y * C1) + (T2.
y * C2) + (T3.
y * C3));
865 while ((bx < lx) && ((C2 | C3) >= 0))
867 ZBUFFER_t& W = zbuf[bx];
868 const ZBUFFER_t aa = (std::is_same<ZBUFFER_t, uint16_t>::value) ? ((ZBUFFER_t)(cw * wa + wb)) : ((ZBUFFER_t)cw);
874 if (TEXTURE_BILINEAR)
876 const float xx = tx * icw;
877 const float yy = ty * icw;
878 const int ttx = (int)floorf(xx);
879 const int tty = (int)floorf(yy);
880 const float ax = xx - ttx;
881 const float ay = yy - tty;
882 const int minx = (TEXTURE_WRAP ? (ttx & (texsize_x_mm)) :
shaderclip(ttx, texsize_x_mm));
883 const int maxx = (TEXTURE_WRAP ? ((ttx + 1) & (texsize_x_mm)) :
shaderclip(ttx + 1, texsize_x_mm));
884 const int miny = (TEXTURE_WRAP ? ((tty & (texsize_y_mm)) * texstride) :
shaderclip(tty, texsize_y_mm) * texstride);
885 const int maxy = (TEXTURE_WRAP ? (((tty + 1) & (texsize_y_mm)) * texstride) :
shaderclip(tty + 1, texsize_y_mm) * texstride);
890 const int ttx = (TEXTURE_WRAP ? ((int)((tx * icw))) & (texsize_x_mm) :
shaderclip((
int)(tx * icw), texsize_x_mm));
891 const int tty = (TEXTURE_WRAP ? ((int)((ty * icw))) & (texsize_y_mm) :
shaderclip((
int)(ty * icw), texsize_y_mm));
892 col = tex[ttx + (tty)*texstride];
895 col.mult256(fPR, fPG, fPB);
922 template<
typename color_t,
typename ZBUFFER_t,
bool TEXTURE_BILINEAR,
bool TEXTURE_WRAP>
924 const int32_t dx1,
const int32_t dy1, int32_t O1,
const RasterizerVec4& fP1,
925 const int32_t dx2,
const int32_t dy2, int32_t O2,
const RasterizerVec4& fP2,
926 const int32_t dx3,
const int32_t dy3, int32_t O3,
const RasterizerVec4& fP3,
927 const RasterizerParams<color_t, color_t, ZBUFFER_t>& data)
929 color_t* buf = data.im->data() + offset;
930 ZBUFFER_t* zbuf = data.zbuf + offset;
932 const float wa = data.wa;
933 const float wb = data.wb;
937 const int32_t stride = data.im->stride();
938 const int32_t zstride = data.im->lx();
940 const uintptr_t end = (uintptr_t)(buf + (ly * stride));
941 const int32_t pa = O1 + O2 + O3;
942 const int32_t E = ((pa == 0) ? 1 : 0);
943 const int32_t aera = pa + E;
945 const float invaera =
fast_inv((
float)aera);
946 const float fP1a = fP1.w * invaera;
947 const float fP2a = fP2.w * invaera;
948 const float fP3a = fP3.w * invaera;
950 const float dw = (dx1 * fP1a) + (dx2 * fP2a) + (dx3 * fP3a);
955 const int fP1R = (
int)(256 * cf1.
R);
956 const int fP1G = (int)(256 * cf1.
G);
957 const int fP1B = (int)(256 * cf1.
B);
958 const int fP21R = (int)(256 * (cf2.R - cf1.
R));
959 const int fP21G = (int)(256 * (cf2.G - cf1.
G));
960 const int fP21B = (int)(256 * (cf2.B - cf1.
B));
961 const int fP31R = (int)(256 * (cf3.
R - cf1.
R));
962 const int fP31G = (int)(256 * (cf3.
G - cf1.
G));
963 const int fP31B = (int)(256 * (cf3.
B - cf1.
B));
970 const color_t* tex = data.tex->data();
971 const int32_t texsize_x = data.tex->width();
972 const int32_t texsize_y = data.tex->height();
973 const int32_t texsize_x_mm = texsize_x - 1;
974 const int32_t texsize_y_mm = texsize_y - 1;
975 const int32_t texstride = data.tex->stride();
988 const float dtx = ((T1.
x * dx1) + (T2.
x * dx2) + (T3.
x * dx3));
989 const float dty = ((T1.
y * dx1) + (T2.
y * dx2) + (T3.
y * dx3));
991 while ((uintptr_t)(buf) < end)
997 bx = (-O1 + dx1 - 1) / dx1;
1003 if (dy2 <= 0)
return;
1004 const int32_t by = (-O2 + dy2 - 1) / dy2;
1008 const int32_t offs = by * stride;
1013 bx =
max(bx, ((-O2 + dx2 - 1) / dx2));
1019 if (dy3 <= 0)
return;
1020 const int32_t by = (-O3 + dy3 - 1) / dy3;
1024 const int32_t offs = by * stride;
1029 bx =
max(bx, ((-O3 + dx3 - 1) / dx3));
1031 int32_t C1 = O1 + (dx1 * bx) + E;
1032 int32_t C2 = O2 + (dx2 * bx);
1033 int32_t C3 = O3 + (dx3 * bx);
1034 float cw = ((C1 * fP1a) + (C2 * fP2a) + (C3 * fP3a));
1036 float tx = ((T1.
x * C1) + (T2.
x * C2) + (T3.
x * C3));
1037 float ty = ((T1.
y * C1) + (T2.
y * C2) + (T3.
y * C3));
1039 while ((bx < lx) && ((C2 | C3) >= 0))
1041 ZBUFFER_t& W = zbuf[bx];
1042 const ZBUFFER_t aa = (std::is_same<ZBUFFER_t, uint16_t>::value) ? ((ZBUFFER_t)(cw * wa + wb)) : ((ZBUFFER_t)cw);
1049 if (TEXTURE_BILINEAR)
1051 const float xx = tx * icw;
1052 const float yy = ty * icw;
1053 const int ttx = (int)floorf(xx);
1054 const int tty = (int)floorf(yy);
1055 const float ax = xx - ttx;
1056 const float ay = yy - tty;
1057 const int minx = (TEXTURE_WRAP ? (ttx & (texsize_x_mm)) :
shaderclip(ttx, texsize_x_mm));
1058 const int maxx = (TEXTURE_WRAP ? ((ttx + 1) & (texsize_x_mm)) :
shaderclip(ttx + 1, texsize_x_mm));
1059 const int miny = (TEXTURE_WRAP ? ((tty & (texsize_y_mm)) * texstride) :
shaderclip(tty, texsize_y_mm) * texstride);
1060 const int maxy = (TEXTURE_WRAP ? (((tty + 1) & (texsize_y_mm)) * texstride) :
shaderclip(tty + 1, texsize_y_mm) * texstride);
1065 const int ttx = (TEXTURE_WRAP ? ((int)((tx * icw))) & (texsize_x_mm) :
shaderclip((
int)(tx * icw), texsize_x_mm));
1066 const int tty = (TEXTURE_WRAP ? ((int)((ty * icw))) & (texsize_y_mm) :
shaderclip((
int)(ty * icw), texsize_y_mm));
1067 col = tex[ttx + (tty)*texstride];
1070 const int r = fP1R + ((C2 * fP21R + C3 * fP31R) / aera);
1071 const int g = fP1G + ((C2 * fP21G + C3 * fP31G) / aera);
1072 const int b = fP1B + ((C2 * fP21B + C3 * fP31B) / aera);
1073 col.mult256(r, g, b);
1100 template<
typename color_t,
typename ZBUFFER_t,
bool TEXTURE_BILINEAR,
bool TEXTURE_WRAP>
1102 const int32_t dx1,
const int32_t dy1, int32_t O1,
const RasterizerVec4& fP1,
1103 const int32_t dx2,
const int32_t dy2, int32_t O2,
const RasterizerVec4& fP2,
1104 const int32_t dx3,
const int32_t dy3, int32_t O3,
const RasterizerVec4& fP3,
1105 const RasterizerParams<color_t, color_t, ZBUFFER_t>& data)
1107 color_t* buf = data.im->data() + offset;
1108 const int32_t stride = data.im->stride();
1110 const uintptr_t end = (uintptr_t)(buf + (ly * stride));
1111 const int32_t pa = O1 + O2 + O3;
1112 const int32_t E = ((pa == 0) ? 1 : 0);
1113 const int32_t aera = pa + E;
1115 const float invaera =
fast_inv((
float)aera);
1117 const RGBf& cf = (
RGBf)data.facecolor;
1118 const int fPR = (
int)(256 * cf.
R);
1119 const int fPG = (int)(256 * cf.
G);
1120 const int fPB = (int)(256 * cf.
B);
1127 const color_t* tex = data.tex->data();
1128 const int32_t texsize_x = data.tex->width();
1129 const int32_t texsize_y = data.tex->height();
1130 const int32_t texsize_x_mm = texsize_x - 1;
1131 const int32_t texsize_y_mm = texsize_y - 1;
1132 const int32_t texstride = data.tex->stride();
1145 const float dtx = ((T1.
x * dx1) + (T2.
x * dx2) + (T3.
x * dx3));
1146 const float dty = ((T1.
y * dx1) + (T2.
y * dx2) + (T3.
y * dx3));
1148 while ((uintptr_t)(buf) < end)
1154 bx = (-O1 + dx1 - 1) / dx1;
1160 if (dy2 <= 0)
return;
1161 const int32_t by = (-O2 + dy2 - 1) / dy2;
1165 const int32_t offs = by * stride;
1169 bx =
max(bx, ((-O2 + dx2 - 1) / dx2));
1175 if (dy3 <= 0)
return;
1176 const int32_t by = (-O3 + dy3 - 1) / dy3;
1180 const int32_t offs = by * stride;
1184 bx =
max(bx, ((-O3 + dx3 - 1) / dx3));
1186 int32_t C1 = O1 + (dx1 * bx) + E;
1187 int32_t C2 = O2 + (dx2 * bx);
1188 int32_t C3 = O3 + (dx3 * bx);
1190 float tx = ((T1.
x * C1) + (T2.
x * C2) + (T3.
x * C3));
1191 float ty = ((T1.
y * C1) + (T2.
y * C2) + (T3.
y * C3));
1193 while ((bx < lx) && ((C2 | C3) >= 0))
1197 if (TEXTURE_BILINEAR)
1199 const float xx = tx;
1200 const float yy = ty;
1201 const int ttx = (int)floorf(xx);
1202 const int tty = (int)floorf(yy);
1203 const float ax = xx - ttx;
1204 const float ay = yy - tty;
1205 const int minx = (TEXTURE_WRAP ? (ttx & (texsize_x_mm)) :
shaderclip(ttx, texsize_x_mm));
1206 const int maxx = (TEXTURE_WRAP ? ((ttx + 1) & (texsize_x_mm)) :
shaderclip(ttx + 1, texsize_x_mm));
1207 const int miny = (TEXTURE_WRAP ? ((tty & (texsize_y_mm)) * texstride) :
shaderclip(tty, texsize_y_mm) * texstride);
1208 const int maxy = (TEXTURE_WRAP ? (((tty + 1) & (texsize_y_mm)) * texstride) :
shaderclip(tty + 1, texsize_y_mm) * texstride);
1213 const int ttx = (TEXTURE_WRAP ? ((int)((tx))) & (texsize_x_mm) :
shaderclip((
int)(tx), texsize_x_mm));
1214 const int tty = (TEXTURE_WRAP ? ((int)((ty))) & (texsize_y_mm) :
shaderclip((
int)(ty), texsize_y_mm));
1215 col = tex[ttx + (tty)*texstride];
1218 col.mult256(fPR, fPG, fPB);
1242 template<
typename color_t,
typename ZBUFFER_t,
bool TEXTURE_BILINEAR,
bool TEXTURE_WRAP>
1244 const int32_t dx1,
const int32_t dy1, int32_t O1,
const RasterizerVec4& fP1,
1245 const int32_t dx2,
const int32_t dy2, int32_t O2,
const RasterizerVec4& fP2,
1246 const int32_t dx3,
const int32_t dy3, int32_t O3,
const RasterizerVec4& fP3,
1247 const RasterizerParams<color_t, color_t, ZBUFFER_t>& data)
1249 color_t* buf = data.im->data() + offset;
1250 const int32_t stride = data.im->stride();
1252 const uintptr_t end = (uintptr_t)(buf + (ly * stride));
1253 const int32_t pa = O1 + O2 + O3;
1254 const int32_t E = ((pa == 0) ? 1 : 0);
1255 const int32_t aera = pa + E;
1257 const float invaera =
fast_inv((
float)aera);
1262 const int fP1R = (
int)(256 * cf1.
R);
1263 const int fP1G = (int)(256 * cf1.
G);
1264 const int fP1B = (int)(256 * cf1.
B);
1265 const int fP21R = (int)(256 * (cf2.R - cf1.
R));
1266 const int fP21G = (int)(256 * (cf2.G - cf1.
G));
1267 const int fP21B = (int)(256 * (cf2.B - cf1.
B));
1268 const int fP31R = (int)(256 * (cf3.
R - cf1.
R));
1269 const int fP31G = (int)(256 * (cf3.
G - cf1.
G));
1270 const int fP31B = (int)(256 * (cf3.
B - cf1.
B));
1277 const color_t* tex = data.tex->data();
1278 const int32_t texsize_x = data.tex->width();
1279 const int32_t texsize_y = data.tex->height();
1280 const int32_t texsize_x_mm = texsize_x - 1;
1281 const int32_t texsize_y_mm = texsize_y - 1;
1282 const int32_t texstride = data.tex->stride();
1295 const float dtx = ((T1.
x * dx1) + (T2.
x * dx2) + (T3.
x * dx3));
1296 const float dty = ((T1.
y * dx1) + (T2.
y * dx2) + (T3.
y * dx3));
1298 while ((uintptr_t)(buf) < end)
1304 bx = (-O1 + dx1 - 1) / dx1;
1310 if (dy2 <= 0)
return;
1311 const int32_t by = (-O2 + dy2 - 1) / dy2;
1315 const int32_t offs = by * stride;
1319 bx =
max(bx, ((-O2 + dx2 - 1) / dx2));
1325 if (dy3 <= 0)
return;
1326 const int32_t by = (-O3 + dy3 - 1) / dy3;
1330 const int32_t offs = by * stride;
1334 bx =
max(bx, ((-O3 + dx3 - 1) / dx3));
1337 int32_t C1 = O1 + (dx1 * bx) + E;
1338 int32_t C2 = O2 + (dx2 * bx);
1339 int32_t C3 = O3 + (dx3 * bx);
1341 float tx = ((T1.
x * C1) + (T2.
x * C2) + (T3.
x * C3));
1342 float ty = ((T1.
y * C1) + (T2.
y * C2) + (T3.
y * C3));
1344 while ((bx < lx) && ((C2 | C3) >= 0))
1348 if (TEXTURE_BILINEAR)
1350 const float xx = tx;
1351 const float yy = ty;
1352 const int ttx = (int)floorf(xx);
1353 const int tty = (int)floorf(yy);
1354 const float ax = xx - ttx;
1355 const float ay = yy - tty;
1356 const int minx = (TEXTURE_WRAP ? (ttx & (texsize_x_mm)) :
shaderclip(ttx, texsize_x_mm));
1357 const int maxx = (TEXTURE_WRAP ? ((ttx + 1) & (texsize_x_mm)) :
shaderclip(ttx + 1, texsize_x_mm));
1358 const int miny = (TEXTURE_WRAP ? ((tty & (texsize_y_mm)) * texstride) :
shaderclip(tty, texsize_y_mm) * texstride);
1359 const int maxy = (TEXTURE_WRAP ? (((tty + 1) & (texsize_y_mm)) * texstride) :
shaderclip(tty + 1, texsize_y_mm) * texstride);
1364 const int ttx = (TEXTURE_WRAP ? ((int)((tx))) & (texsize_x_mm) :
shaderclip((
int)(tx), texsize_x_mm));
1365 const int tty = (TEXTURE_WRAP ? ((int)((ty))) & (texsize_y_mm) :
shaderclip((
int)(ty), texsize_y_mm));
1366 col = tex[ttx + (tty)*texstride];
1369 const int r = fP1R + ((C2 * fP21R + C3 * fP31R) / aera);
1370 const int g = fP1G + ((C2 * fP21G + C3 * fP31G) / aera);
1371 const int b = fP1B + ((C2 * fP21B + C3 * fP31B) / aera);
1372 col.mult256(r, g, b);
1396 template<
typename color_t,
typename ZBUFFER_t,
bool TEXTURE_BILINEAR,
bool TEXTURE_WRAP>
1398 const int32_t dx1,
const int32_t dy1, int32_t O1,
const RasterizerVec4& fP1,
1399 const int32_t dx2,
const int32_t dy2, int32_t O2,
const RasterizerVec4& fP2,
1400 const int32_t dx3,
const int32_t dy3, int32_t O3,
const RasterizerVec4& fP3,
1401 const RasterizerParams<color_t, color_t, ZBUFFER_t>& data)
1403 color_t* buf = data.im->data() + offset;
1404 ZBUFFER_t* zbuf = data.zbuf + offset;
1406 const float wa = data.wa;
1407 const float wb = data.wb;
1411 const int32_t stride = data.im->stride();
1412 const int32_t zstride = data.im->lx();
1414 const uintptr_t end = (uintptr_t)(buf + (ly * stride));
1415 const int32_t pa = O1 + O2 + O3;
1416 const int32_t E = ((pa == 0) ? 1 : 0);
1417 const int32_t aera = pa + E;
1419 const float invaera =
fast_inv((
float)aera);
1420 const float fP1a = fP1.w * invaera;
1421 const float fP2a = fP2.w * invaera;
1422 const float fP3a = fP3.w * invaera;
1424 const float dw = (dx1 * fP1a) + (dx2 * fP2a) + (dx3 * fP3a);
1426 const RGBf& cf = (
RGBf)data.facecolor;
1427 const int fPR = (
int)(256 * cf.
R);
1428 const int fPG = (int)(256 * cf.
G);
1429 const int fPB = (int)(256 * cf.
B);
1436 const color_t* tex = data.tex->data();
1437 const int32_t texsize_x = data.tex->width();
1438 const int32_t texsize_y = data.tex->height();
1439 const int32_t texsize_x_mm = texsize_x - 1;
1440 const int32_t texsize_y_mm = texsize_y - 1;
1441 const int32_t texstride = data.tex->stride();
1454 const float dtx = ((T1.
x * dx1) + (T2.
x * dx2) + (T3.
x * dx3));
1455 const float dty = ((T1.
y * dx1) + (T2.
y * dx2) + (T3.
y * dx3));
1457 while ((uintptr_t)(buf) < end)
1463 bx = (-O1 + dx1 - 1) / dx1;
1469 if (dy2 <= 0)
return;
1470 const int32_t by = (-O2 + dy2 - 1) / dy2;
1474 const int32_t offs = by * stride;
1479 bx =
max(bx, ((-O2 + dx2 - 1) / dx2));
1485 if (dy3 <= 0)
return;
1486 const int32_t by = (-O3 + dy3 - 1) / dy3;
1490 const int32_t offs = by * stride;
1495 bx =
max(bx, ((-O3 + dx3 - 1) / dx3));
1498 int32_t C1 = O1 + (dx1 * bx) + E;
1499 int32_t C2 = O2 + (dx2 * bx);
1500 int32_t C3 = O3 + (dx3 * bx);
1501 float cw = ((C1 * fP1a) + (C2 * fP2a) + (C3 * fP3a));
1503 float tx = ((T1.
x * C1) + (T2.
x * C2) + (T3.
x * C3));
1504 float ty = ((T1.
y * C1) + (T2.
y * C2) + (T3.
y * C3));
1506 while ((bx < lx) && ((C2 | C3) >= 0))
1508 ZBUFFER_t& W = zbuf[bx];
1509 const ZBUFFER_t aa = (std::is_same<ZBUFFER_t, uint16_t>::value) ? ((ZBUFFER_t)(cw * wa + wb)) : ((ZBUFFER_t)cw);
1515 if (TEXTURE_BILINEAR)
1517 const float xx = tx;
1518 const float yy = ty;
1519 const int ttx = (int)floorf(xx);
1520 const int tty = (int)floorf(yy);
1521 const float ax = xx - ttx;
1522 const float ay = yy - tty;
1523 const int minx = (TEXTURE_WRAP ? (ttx & (texsize_x_mm)) :
shaderclip(ttx, texsize_x_mm));
1524 const int maxx = (TEXTURE_WRAP ? ((ttx + 1) & (texsize_x_mm)) :
shaderclip(ttx + 1, texsize_x_mm));
1525 const int miny = (TEXTURE_WRAP ? ((tty & (texsize_y_mm)) * texstride) :
shaderclip(tty, texsize_y_mm) * texstride);
1526 const int maxy = (TEXTURE_WRAP ? (((tty + 1) & (texsize_y_mm)) * texstride) :
shaderclip(tty + 1, texsize_y_mm) * texstride);
1531 const int ttx = (TEXTURE_WRAP ? ((int)((tx))) & (texsize_x_mm) :
shaderclip((
int)(tx), texsize_x_mm));
1532 const int tty = (TEXTURE_WRAP ? ((int)((ty))) & (texsize_y_mm) :
shaderclip((
int)(ty), texsize_y_mm));
1533 col = tex[ttx + (tty)*texstride];
1536 col.mult256(fPR, fPG, fPB);
1563 template<
typename color_t,
typename ZBUFFER_t,
bool TEXTURE_BILINEAR,
bool TEXTURE_WRAP>
1565 const int32_t dx1,
const int32_t dy1, int32_t O1,
const RasterizerVec4& fP1,
1566 const int32_t dx2,
const int32_t dy2, int32_t O2,
const RasterizerVec4& fP2,
1567 const int32_t dx3,
const int32_t dy3, int32_t O3,
const RasterizerVec4& fP3,
1568 const RasterizerParams<color_t, color_t, ZBUFFER_t>& data)
1570 color_t* buf = data.im->data() + offset;
1571 ZBUFFER_t* zbuf = data.zbuf + offset;
1573 const float wa = data.wa;
1574 const float wb = data.wb;
1578 const int32_t stride = data.im->stride();
1579 const int32_t zstride = data.im->lx();
1581 const uintptr_t end = (uintptr_t)(buf + (ly * stride));
1582 const int32_t pa = O1 + O2 + O3;
1583 const int32_t E = ((pa == 0) ? 1 : 0);
1584 const int32_t aera = pa + E;
1586 const float invaera =
fast_inv((
float)aera);
1587 const float fP1a = fP1.w * invaera;
1588 const float fP2a = fP2.w * invaera;
1589 const float fP3a = fP3.w * invaera;
1591 const float dw = (dx1 * fP1a) + (dx2 * fP2a) + (dx3 * fP3a);
1596 const int fP1R = (
int)(256 * cf1.
R);
1597 const int fP1G = (int)(256 * cf1.
G);
1598 const int fP1B = (int)(256 * cf1.
B);
1599 const int fP21R = (int)(256 * (cf2.R - cf1.
R));
1600 const int fP21G = (int)(256 * (cf2.G - cf1.
G));
1601 const int fP21B = (int)(256 * (cf2.B - cf1.
B));
1602 const int fP31R = (int)(256 * (cf3.
R - cf1.
R));
1603 const int fP31G = (int)(256 * (cf3.
G - cf1.
G));
1604 const int fP31B = (int)(256 * (cf3.
B - cf1.
B));
1611 const color_t* tex = data.tex->data();
1612 const int32_t texsize_x = data.tex->width();
1613 const int32_t texsize_y = data.tex->height();
1614 const int32_t texsize_x_mm = texsize_x - 1;
1615 const int32_t texsize_y_mm = texsize_y - 1;
1616 const int32_t texstride = data.tex->stride();
1629 const float dtx = ((T1.
x * dx1) + (T2.
x * dx2) + (T3.
x * dx3));
1630 const float dty = ((T1.
y * dx1) + (T2.
y * dx2) + (T3.
y * dx3));
1632 while ((uintptr_t)(buf) < end)
1638 bx = (-O1 + dx1 - 1) / dx1;
1644 if (dy2 <= 0)
return;
1645 const int32_t by = (-O2 + dy2 - 1) / dy2;
1649 const int32_t offs = by * stride;
1654 bx =
max(bx, ((-O2 + dx2 - 1) / dx2));
1660 if (dy3 <= 0)
return;
1661 const int32_t by = (-O3 + dy3 - 1) / dy3;
1665 const int32_t offs = by * stride;
1670 bx =
max(bx, ((-O3 + dx3 - 1) / dx3));
1673 int32_t C1 = O1 + (dx1 * bx) + E;
1674 int32_t C2 = O2 + (dx2 * bx);
1675 int32_t C3 = O3 + (dx3 * bx);
1676 float cw = ((C1 * fP1a) + (C2 * fP2a) + (C3 * fP3a));
1678 float tx = ((T1.
x * C1) + (T2.
x * C2) + (T3.
x * C3));
1679 float ty = ((T1.
y * C1) + (T2.
y * C2) + (T3.
y * C3));
1681 while ((bx < lx) && ((C2 | C3) >= 0))
1683 ZBUFFER_t& W = zbuf[bx];
1684 const ZBUFFER_t aa = (std::is_same<ZBUFFER_t, uint16_t>::value) ? ((ZBUFFER_t)(cw * wa + wb)) : ((ZBUFFER_t)cw);
1690 if (TEXTURE_BILINEAR)
1692 const float xx = tx;
1693 const float yy = ty;
1694 const int ttx = (int)floorf(xx);
1695 const int tty = (int)floorf(yy);
1696 const float ax = xx - ttx;
1697 const float ay = yy - tty;
1698 const int minx = (TEXTURE_WRAP ? (ttx & (texsize_x_mm)) :
shaderclip(ttx, texsize_x_mm));
1699 const int maxx = (TEXTURE_WRAP ? ((ttx + 1) & (texsize_x_mm)) :
shaderclip(ttx + 1, texsize_x_mm));
1700 const int miny = (TEXTURE_WRAP ? ((tty & (texsize_y_mm)) * texstride) :
shaderclip(tty, texsize_y_mm) * texstride);
1701 const int maxy = (TEXTURE_WRAP ? (((tty + 1) & (texsize_y_mm)) * texstride) :
shaderclip(tty + 1, texsize_y_mm) * texstride);
1706 const int ttx = (TEXTURE_WRAP ? ((int)((tx))) & (texsize_x_mm) :
shaderclip((
int)(tx), texsize_x_mm));
1707 const int tty = (TEXTURE_WRAP ? ((int)((ty))) & (texsize_y_mm) :
shaderclip((
int)(ty), texsize_y_mm));
1708 col = tex[ttx + (tty)*texstride];
1711 const int r = fP1R + ((C2 * fP21R + C3 * fP31R) / aera);
1712 const int g = fP1G + ((C2 * fP21G + C3 * fP31G) / aera);
1713 const int b = fP1B + ((C2 * fP21B + C3 * fP31B) / aera);
1715 col.mult256(r, g, b);
1744 template<
int SHADER_FLAGS_ENABLED,
typename color_t,
typename ZBUFFER_t>
void shader_select(
const int32_t& offset,
const int32_t& lx,
const int32_t& ly,
1745 const int32_t dx1,
const int32_t dy1, int32_t O1,
const RasterizerVec4& fP1,
1746 const int32_t dx2,
const int32_t dy2, int32_t O2,
const RasterizerVec4& fP2,
1747 const int32_t dx3,
const int32_t dy3, int32_t O3,
const RasterizerVec4& fP3,
1748 const RasterizerParams<color_t, color_t, ZBUFFER_t> & data)
1750 int raster_type = data.shader_type;
1751 if (TGX_SHADER_HAS_ZBUFFER(SHADER_FLAGS_ENABLED) && (TGX_SHADER_HAS_ZBUFFER(raster_type)))
1753 if (TGX_SHADER_HAS_ORTHO(SHADER_FLAGS_ENABLED) && (TGX_SHADER_HAS_ORTHO(raster_type)))
1755 if (TGX_SHADER_HAS_TEXTURE(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE(raster_type))
1757 if (TGX_SHADER_HAS_GOURAUD(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_GOURAUD(raster_type))
1759 if (TGX_SHADER_HAS_TEXTURE_BILINEAR(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_BILINEAR(raster_type))
1761 if (TGX_SHADER_HAS_TEXTURE_CLAMP(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_CLAMP(raster_type))
1762 shader_Gouraud_Texture_Zbuffer_Ortho<color_t,ZBUFFER_t, true,false>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1763 else if (TGX_SHADER_HAS_TEXTURE_WRAP_POW2(SHADER_FLAGS_ENABLED))
1764 shader_Gouraud_Texture_Zbuffer_Ortho<color_t, ZBUFFER_t, true, true>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1766 else if (TGX_SHADER_HAS_TEXTURE_NEAREST(SHADER_FLAGS_ENABLED))
1768 if (TGX_SHADER_HAS_TEXTURE_CLAMP(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_CLAMP(raster_type))
1769 shader_Gouraud_Texture_Zbuffer_Ortho<color_t, ZBUFFER_t, false,false>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1770 else if (TGX_SHADER_HAS_TEXTURE_WRAP_POW2(SHADER_FLAGS_ENABLED))
1771 shader_Gouraud_Texture_Zbuffer_Ortho<color_t, ZBUFFER_t, false,true>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1774 else if (TGX_SHADER_HAS_FLAT(SHADER_FLAGS_ENABLED))
1776 if (TGX_SHADER_HAS_TEXTURE_BILINEAR(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_BILINEAR(raster_type))
1778 if (TGX_SHADER_HAS_TEXTURE_CLAMP(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_CLAMP(raster_type))
1779 shader_Flat_Texture_Zbuffer_Ortho<color_t, ZBUFFER_t, true,false>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1780 else if (TGX_SHADER_HAS_TEXTURE_WRAP_POW2(SHADER_FLAGS_ENABLED))
1781 shader_Flat_Texture_Zbuffer_Ortho<color_t, ZBUFFER_t, true,true>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1783 else if (TGX_SHADER_HAS_TEXTURE_NEAREST(SHADER_FLAGS_ENABLED))
1785 if (TGX_SHADER_HAS_TEXTURE_CLAMP(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_CLAMP(raster_type))
1786 shader_Flat_Texture_Zbuffer_Ortho<color_t, ZBUFFER_t, false,false>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1787 else if (TGX_SHADER_HAS_TEXTURE_WRAP_POW2(SHADER_FLAGS_ENABLED))
1788 shader_Flat_Texture_Zbuffer_Ortho<color_t, ZBUFFER_t, false,true>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1792 else if (TGX_SHADER_HAS_NOTEXTURE(SHADER_FLAGS_ENABLED))
1794 if (TGX_SHADER_HAS_GOURAUD(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_GOURAUD(raster_type))
1795 shader_Gouraud_Zbuffer<color_t, ZBUFFER_t>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1796 else if (TGX_SHADER_HAS_FLAT(SHADER_FLAGS_ENABLED))
1797 shader_Flat_Zbuffer<color_t, ZBUFFER_t>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1800 else if (TGX_SHADER_HAS_PERSPECTIVE(SHADER_FLAGS_ENABLED))
1802 if (TGX_SHADER_HAS_TEXTURE(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE(raster_type))
1804 if (TGX_SHADER_HAS_GOURAUD(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_GOURAUD(raster_type))
1806 if (TGX_SHADER_HAS_TEXTURE_BILINEAR(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_BILINEAR(raster_type))
1808 if (TGX_SHADER_HAS_TEXTURE_CLAMP(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_CLAMP(raster_type))
1809 shader_Gouraud_Texture_Zbuffer<color_t, ZBUFFER_t, true,false>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1810 else if (TGX_SHADER_HAS_TEXTURE_WRAP_POW2(SHADER_FLAGS_ENABLED))
1811 shader_Gouraud_Texture_Zbuffer<color_t, ZBUFFER_t, true, true>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1813 else if (TGX_SHADER_HAS_TEXTURE_NEAREST(SHADER_FLAGS_ENABLED))
1815 if (TGX_SHADER_HAS_TEXTURE_CLAMP(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_CLAMP(raster_type))
1816 shader_Gouraud_Texture_Zbuffer<color_t, ZBUFFER_t, false,false>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1817 else if (TGX_SHADER_HAS_TEXTURE_WRAP_POW2(SHADER_FLAGS_ENABLED))
1818 shader_Gouraud_Texture_Zbuffer<color_t, ZBUFFER_t, false,true>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1821 else if (TGX_SHADER_HAS_FLAT(SHADER_FLAGS_ENABLED))
1823 if (TGX_SHADER_HAS_TEXTURE_BILINEAR(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_BILINEAR(raster_type))
1825 if (TGX_SHADER_HAS_TEXTURE_CLAMP(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_CLAMP(raster_type))
1826 shader_Flat_Texture_Zbuffer<color_t, ZBUFFER_t, true,false>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1827 else if (TGX_SHADER_HAS_TEXTURE_WRAP_POW2(SHADER_FLAGS_ENABLED))
1828 shader_Flat_Texture_Zbuffer<color_t, ZBUFFER_t, true,true>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1830 else if (TGX_SHADER_HAS_TEXTURE_NEAREST(SHADER_FLAGS_ENABLED))
1832 if (TGX_SHADER_HAS_TEXTURE_CLAMP(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_CLAMP(raster_type))
1833 shader_Flat_Texture_Zbuffer<color_t, ZBUFFER_t, false,false>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1834 else if (TGX_SHADER_HAS_TEXTURE_WRAP_POW2(SHADER_FLAGS_ENABLED))
1835 shader_Flat_Texture_Zbuffer<color_t, ZBUFFER_t, false,true>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1839 else if (TGX_SHADER_HAS_NOTEXTURE(SHADER_FLAGS_ENABLED))
1841 if (TGX_SHADER_HAS_GOURAUD(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_GOURAUD(raster_type))
1842 shader_Gouraud_Zbuffer<color_t, ZBUFFER_t>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1843 else if (TGX_SHADER_HAS_FLAT(SHADER_FLAGS_ENABLED))
1844 shader_Flat_Zbuffer<color_t, ZBUFFER_t>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1848 else if (TGX_SHADER_HAS_NOZBUFFER(SHADER_FLAGS_ENABLED))
1850 if (TGX_SHADER_HAS_ORTHO(SHADER_FLAGS_ENABLED) && (TGX_SHADER_HAS_ORTHO(raster_type)))
1852 if (TGX_SHADER_HAS_TEXTURE(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE(raster_type))
1854 if (TGX_SHADER_HAS_GOURAUD(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_GOURAUD(raster_type))
1856 if (TGX_SHADER_HAS_TEXTURE_BILINEAR(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_BILINEAR(raster_type))
1858 if (TGX_SHADER_HAS_TEXTURE_CLAMP(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_CLAMP(raster_type))
1859 shader_Gouraud_Texture_Ortho<color_t, ZBUFFER_t, true,false>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1860 else if (TGX_SHADER_HAS_TEXTURE_WRAP_POW2(SHADER_FLAGS_ENABLED))
1861 shader_Gouraud_Texture_Ortho<color_t, ZBUFFER_t, true,true>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1863 else if (TGX_SHADER_HAS_TEXTURE_NEAREST(SHADER_FLAGS_ENABLED))
1865 if (TGX_SHADER_HAS_TEXTURE_CLAMP(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_CLAMP(raster_type))
1866 shader_Gouraud_Texture_Ortho<color_t, ZBUFFER_t, false,false>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1867 else if (TGX_SHADER_HAS_TEXTURE_WRAP_POW2(SHADER_FLAGS_ENABLED))
1868 shader_Gouraud_Texture_Ortho<color_t, ZBUFFER_t, false,true>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1871 else if (TGX_SHADER_HAS_FLAT(SHADER_FLAGS_ENABLED))
1873 if (TGX_SHADER_HAS_TEXTURE_BILINEAR(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_BILINEAR(raster_type))
1875 if (TGX_SHADER_HAS_TEXTURE_CLAMP(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_CLAMP(raster_type))
1876 shader_Flat_Texture_Ortho<color_t, ZBUFFER_t, true,false>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1877 else if (TGX_SHADER_HAS_TEXTURE_WRAP_POW2(SHADER_FLAGS_ENABLED))
1878 shader_Flat_Texture_Ortho<color_t, ZBUFFER_t, true,true>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1880 else if (TGX_SHADER_HAS_TEXTURE_NEAREST(SHADER_FLAGS_ENABLED))
1882 if (TGX_SHADER_HAS_TEXTURE_CLAMP(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_CLAMP(raster_type))
1883 shader_Flat_Texture_Ortho<color_t, ZBUFFER_t, false,false>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1884 else if (TGX_SHADER_HAS_TEXTURE_WRAP_POW2(SHADER_FLAGS_ENABLED))
1885 shader_Flat_Texture_Ortho<color_t, ZBUFFER_t, false,true>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1889 else if (TGX_SHADER_HAS_NOTEXTURE(SHADER_FLAGS_ENABLED))
1891 if (TGX_SHADER_HAS_GOURAUD(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_GOURAUD(raster_type))
1892 shader_Gouraud<color_t, ZBUFFER_t>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1893 else if (TGX_SHADER_HAS_FLAT(SHADER_FLAGS_ENABLED))
1894 shader_Flat<color_t, ZBUFFER_t>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1897 else if (TGX_SHADER_HAS_PERSPECTIVE(SHADER_FLAGS_ENABLED))
1899 if (TGX_SHADER_HAS_TEXTURE(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE(raster_type))
1901 if (TGX_SHADER_HAS_GOURAUD(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_GOURAUD(raster_type))
1903 if (TGX_SHADER_HAS_TEXTURE_BILINEAR(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_BILINEAR(raster_type))
1905 if (TGX_SHADER_HAS_TEXTURE_CLAMP(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_CLAMP(raster_type))
1906 shader_Gouraud_Texture<color_t, ZBUFFER_t, true, false>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1907 else if (TGX_SHADER_HAS_TEXTURE_WRAP_POW2(SHADER_FLAGS_ENABLED))
1908 shader_Gouraud_Texture<color_t, ZBUFFER_t, true, true>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1910 else if (TGX_SHADER_HAS_TEXTURE_NEAREST(SHADER_FLAGS_ENABLED))
1912 if (TGX_SHADER_HAS_TEXTURE_CLAMP(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_CLAMP(raster_type))
1913 shader_Gouraud_Texture<color_t, ZBUFFER_t, false, false>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1914 else if (TGX_SHADER_HAS_TEXTURE_WRAP_POW2(SHADER_FLAGS_ENABLED))
1915 shader_Gouraud_Texture<color_t, ZBUFFER_t, false, true>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1918 else if (TGX_SHADER_HAS_FLAT(SHADER_FLAGS_ENABLED))
1920 if (TGX_SHADER_HAS_TEXTURE_BILINEAR(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_BILINEAR(raster_type))
1922 if (TGX_SHADER_HAS_TEXTURE_CLAMP(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_CLAMP(raster_type))
1923 shader_Flat_Texture<color_t, ZBUFFER_t, true, false>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1924 else if (TGX_SHADER_HAS_TEXTURE_WRAP_POW2(SHADER_FLAGS_ENABLED))
1925 shader_Flat_Texture<color_t, ZBUFFER_t, true, true>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1927 else if (TGX_SHADER_HAS_TEXTURE_NEAREST(SHADER_FLAGS_ENABLED))
1929 if (TGX_SHADER_HAS_TEXTURE_CLAMP(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_TEXTURE_CLAMP(raster_type))
1930 shader_Flat_Texture<color_t, ZBUFFER_t, false, false>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1931 else if (TGX_SHADER_HAS_TEXTURE_WRAP_POW2(SHADER_FLAGS_ENABLED))
1932 shader_Flat_Texture<color_t, ZBUFFER_t, false, true>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1936 else if (TGX_SHADER_HAS_NOTEXTURE(SHADER_FLAGS_ENABLED))
1938 if (TGX_SHADER_HAS_GOURAUD(SHADER_FLAGS_ENABLED) && TGX_SHADER_HAS_GOURAUD(raster_type))
1939 shader_Gouraud<color_t, ZBUFFER_t>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1940 else if (TGX_SHADER_HAS_FLAT(SHADER_FLAGS_ENABLED))
1941 shader_Flat<color_t, ZBUFFER_t>(offset, lx, ly, dx1, dy1, O1, fP1, dx2, dy2, O2, fP2, dx3, dy3, O3, fP3, data);
1954 template<
bool USE_BLENDING,
typename color_t_im>
1956 const int32_t dx1,
const int32_t dy1, int32_t O1,
const RasterizerVec4& fP1,
1957 const int32_t dx2,
const int32_t dy2, int32_t O2,
const RasterizerVec4& fP2,
1958 const int32_t dx3,
const int32_t dy3, int32_t O3,
const RasterizerVec4& fP3,
1959 const RasterizerParams<color_t_im, color_t_im, float> & data)
1961 color_t_im * buf = data.im->data() + offset;
1962 const int32_t stride = data.im->stride();
1965 const RGB32 col1 =
RGB64(fP1.color.R, fP1.color.G, fP1.color.B, fP1.A);
1966 const RGB32 col2 =
RGB64(fP2.color.R, fP2.color.G, fP2.color.B, fP2.A);
1967 const RGB32 col3 =
RGB64(fP3.color.R, fP3.color.G, fP3.color.B, fP3.A);
1969 const uintptr_t end = (uintptr_t)(buf + (ly * stride));
1970 const int32_t pa = O1 + O2 + O3;
1971 const int32_t E = ((pa == 0) ? 1 : 0);
1972 const int32_t aera = pa + E;
1973 const int shiftC = (aera > (1 << 22)) ? 10 : 0;
1975 while ((uintptr_t)(buf) < end)
1981 bx = (-O1 + dx1 - 1) / dx1;
1987 if (dy2 <= 0)
return;
1988 const int32_t by = (-O2 + dy2 - 1) / dy2;
1992 const int32_t offs = by * stride;
1996 bx =
max(bx, ((-O2 + dx2 - 1) / dx2));
2002 if (dy3 <= 0)
return;
2003 const int32_t by = (-O3 + dy3 - 1) / dy3;
2007 const int32_t offs = by * stride;
2011 bx =
max(bx, ((-O3 + dx3 - 1) / dx3));
2014 int32_t C2 = O2 + (dx2 * bx);
2015 int32_t C3 = O3 + (dx3 * bx);
2016 while ((bx < lx) && ((C2 | C3) >= 0))
2022 buf[bx] = color_t_im(c);
2045 template<
bool USE_BLENDING,
bool USE_MASKING,
bool USE_GRADIENT,
typename color_t_im,
typename color_t_tex>
2047 const int32_t dx1,
const int32_t dy1, int32_t O1,
const RasterizerVec4& fP1,
2048 const int32_t dx2,
const int32_t dy2, int32_t O2,
const RasterizerVec4& fP2,
2049 const int32_t dx3,
const int32_t dy3, int32_t O3,
const RasterizerVec4& fP3,
2050 const RasterizerParams<color_t_im, color_t_tex, float> & data)
2053 color_t_im * buf = data.im->data() + offset;
2054 const int32_t stride = data.im->stride();
2056 const uintptr_t end = (uintptr_t)(buf + (ly * stride));
2057 const int32_t pa = O1 + O2 + O3;
2058 const int32_t E = ((pa == 0) ? 1 : 0);
2059 const int32_t aera = pa + E;
2061 const float invaera =
fast_inv((
float)aera);
2063 const color_t_tex mask_color = data.mask_color;
2074 const color_t_tex * tex = data.tex->data();
2075 const int32_t texsize_x = data.tex->width();
2076 const int32_t texsize_y = data.tex->height();
2077 const int32_t texsize_x_mm = data.tex->width() - 1;
2078 const int32_t texsize_y_mm = data.tex->height() - 1;
2079 const int32_t texstride = data.tex->stride();
2092 const float dtx = ((T1.x * dx1) + (T2.x * dx2) + (T3.x * dx3));
2093 const float dty = ((T1.y * dx1) + (T2.y * dx2) + (T3.y * dx3));
2095 while ((uintptr_t)(buf) < end)
2101 bx = (-O1 + dx1 - 1) / dx1;
2107 if (dy2 <= 0)
return;
2108 const int32_t by = (-O2 + dy2 - 1) / dy2;
2112 const int32_t offs = by * stride;
2116 bx =
max(bx, ((-O2 + dx2 - 1) / dx2));
2122 if (dy3 <= 0)
return;
2123 const int32_t by = (-O3 + dy3 - 1) / dy3;
2127 const int32_t offs = by * stride;
2131 bx =
max(bx, ((-O3 + dx3 - 1) / dx3));
2134 int32_t C1 = O1 + (dx1 * bx) + E;
2135 int32_t C2 = O2 + (dx2 * bx);
2136 int32_t C3 = O3 + (dx3 * bx);
2138 float tx = ((T1.x * C1) + (T2.x * C2) + (T3.x * C3)) - 0.5f;
2139 float ty = ((T1.y * C1) + (T2.y * C2) + (T3.y * C3)) - 0.5f;
2141 while ((bx < lx) && ((C2 | C3) >= 0))
2143 const float xx = tx;
2144 const float yy = ty;
2145 const int ttx = (int)floorf(xx);
2146 const int tty = (int)floorf(yy);
2147 const float ax = xx - ttx;
2148 const float ay = yy - tty;
2150 const int minx =
shaderclip(ttx, texsize_x_mm);
2151 const int maxx =
shaderclip(ttx + 1, texsize_x_mm);
2152 const int miny =
shaderclip(tty, texsize_y_mm) * texstride;
2153 const int maxy =
shaderclip(tty + 1, texsize_y_mm) * texstride;
2157 auto col00 = tex[minx + miny];
2160 auto col10 = tex[maxx + miny];
2163 auto col01 = tex[minx + maxy];
2166 auto col11 = tex[maxx + maxy];
2175 const int sC1 = aera - C3 - C2;
2176 const float m = 256.0f / aera;
2177 const int r = (int)((sC1 * cf1.
R + sC2 * cf2.R + sC3 * cf3.
R) * m);
2178 const int g = (int)((sC1 * cf1.
G + sC2 * cf2.G + sC3 * cf3.
G) * m);
2179 const int b = (int)((sC1 * cf1.
B + sC2 * cf2.B + sC3 * cf3.
B) * m);
2180 const int a = (int)((sC1 * fP1.A + sC2 * fP2.A + sC3 * fP3.A) * m);
2187 buf[bx] = color_t_im(c);
2191 buf[bx] = color_t_im(col);
2196 color_t_tex col =
interpolateColorsBilinear(tex[minx + miny], tex[maxx + miny], tex[minx + maxy], tex[maxx + maxy], ax, ay);
2201 const int sC1 = aera - C3 - C2;
2202 const float m = 256.0f / aera;
2203 const int r = (int)((sC1 * cf1.
R + sC2 * cf2.R + sC3 * cf3.
R) * m);
2204 const int g = (int)((sC1 * cf1.
G + sC2 * cf2.G + sC3 * cf3.
G) * m);
2205 const int b = (int)((sC1 * cf1.
B + sC2 * cf2.B + sC3 * cf3.
B) * m);
2206 const int a = (int)((sC1 * fP1.A + sC2 * fP2.A + sC3 * fP3.A) * m);
2207 col.mult256(r, g, b, a);
2211 color_t_tex c = color_t_tex(buf[bx]);
2212 c.blend(col, data.opacity);
2213 buf[bx] = color_t_im(c);
2217 buf[bx] = color_t_im(col);
2243 template<
typename BLEND_OP,
typename color_t_im,
typename color_t_tex>
2245 const int32_t dx1,
const int32_t dy1, int32_t O1,
const RasterizerVec4& fP1,
2246 const int32_t dx2,
const int32_t dy2, int32_t O2,
const RasterizerVec4& fP2,
2247 const int32_t dx3,
const int32_t dy3, int32_t O3,
const RasterizerVec4& fP3,
2248 const RasterizerParams<color_t_im, color_t_tex, float, BLEND_OP> & data)
2251 color_t_im * buf = data.im->data() + offset;
2252 const int32_t stride = data.im->stride();
2254 const uintptr_t end = (uintptr_t)(buf + (ly * stride));
2255 const int32_t pa = O1 + O2 + O3;
2256 const int32_t E = ((pa == 0) ? 1 : 0);
2257 const int32_t aera = pa + E;
2259 const float invaera =
fast_inv((
float)aera);
2267 const color_t_tex * tex = data.tex->data();
2268 const int32_t texsize_x = data.tex->width();
2269 const int32_t texsize_y = data.tex->height();
2270 const int32_t texsize_x_mm = data.tex->width() - 1;
2271 const int32_t texsize_y_mm = data.tex->height() - 1;
2272 const int32_t texstride = data.tex->stride();
2285 const float dtx = ((T1.
x * dx1) + (T2.
x * dx2) + (T3.
x * dx3));
2286 const float dty = ((T1.
y * dx1) + (T2.
y * dx2) + (T3.
y * dx3));
2288 while ((uintptr_t)(buf) < end)
2294 bx = (-O1 + dx1 - 1) / dx1;
2300 if (dy2 <= 0)
return;
2301 const int32_t by = (-O2 + dy2 - 1) / dy2;
2305 const int32_t offs = by * stride;
2309 bx =
max(bx, ((-O2 + dx2 - 1) / dx2));
2315 if (dy3 <= 0)
return;
2316 const int32_t by = (-O3 + dy3 - 1) / dy3;
2320 const int32_t offs = by * stride;
2324 bx =
max(bx, ((-O3 + dx3 - 1) / dx3));
2327 int32_t C1 = O1 + (dx1 * bx) + E;
2328 int32_t C2 = O2 + (dx2 * bx);
2329 int32_t C3 = O3 + (dx3 * bx);
2331 float tx = ((T1.
x * C1) + (T2.
x * C2) + (T3.
x * C3)) - 0.5f;
2332 float ty = ((T1.
y * C1) + (T2.
y * C2) + (T3.
y * C3)) - 0.5f;
2334 while ((bx < lx) && ((C2 | C3) >= 0))
2336 const float xx = tx;
2337 const float yy = ty;
2338 const int ttx = (int)floorf(xx);
2339 const int tty = (int)floorf(yy);
2340 const float ax = xx - ttx;
2341 const float ay = yy - tty;
2343 const int minx =
shaderclip(ttx, texsize_x_mm);
2344 const int maxx =
shaderclip(ttx + 1, texsize_x_mm);
2345 const int miny =
shaderclip(tty, texsize_y_mm) * texstride;
2346 const int maxy =
shaderclip(tty + 1, texsize_y_mm) * texstride;
2348 color_t_tex col =
interpolateColorsBilinear(tex[minx + miny], tex[maxx + miny], tex[minx + maxy], tex[maxx + maxy], ax, ay);
2350 buf[bx] = (color_t_im)((*data.p_blend_op)(col, buf[bx]));
const RGB32 RGB32_Red
Color red in RGB32 format.
RGB565 interpolateColorsBilinear(const RGB565 &C00, const RGB565 &C10, const RGB565 &C01, const RGB565 &C11, const float ax, const float ay)
Bilinear interpolation between 4 colors.
Definition: Color.h:621
RGB565 interpolateColorsTriangle(const RGB565 &col1, int32_t C1, const RGB565 &col2, int32_t C2, const RGB565 &col3, const int32_t totC)
Interpolate between 3 colors.
Definition: Color.h:591
TGX_INLINE T max(const T &a, const T &b)
Don't know why but much faster than fmaxf() for floats.
Definition: Misc.h:184
TGX_INLINE float fast_inv(float x)
Fast (approximate) computation of 1/x.
Definition: Misc.h:219
Triangle shader parameters.
void shader_test(const int32_t &offset, const int32_t &lx, const int32_t &ly, const int32_t &dx1, const int32_t &dy1, int32_t O1, const tgx::RasterizerVec4 &fP1, const int32_t &dx2, const int32_t &dy2, int32_t O2, const tgx::RasterizerVec4 &fP2, const int32_t &dx3, const int32_t &dy3, int32_t O3, const tgx::RasterizerVec4 &fP3, const tgx::RasterizerParams< color_t, color_t, ZBUFFER_t > &data)
For test purposes...
Definition: Shaders.h:45
void shader_select(const int32_t &offset, const int32_t &lx, const int32_t &ly, const int32_t dx1, const int32_t dy1, int32_t O1, const RasterizerVec4 &fP1, const int32_t dx2, const int32_t dy2, int32_t O2, const RasterizerVec4 &fP2, const int32_t dx3, const int32_t dy3, int32_t O3, const RasterizerVec4 &fP3, const RasterizerParams< color_t, color_t, ZBUFFER_t > &data)
META-Shader THAT DISPATCH TO THE CORRECT Shader ABOVE (IF ENABLED).
Definition: Shaders.h:1744
void shader_Gouraud_Texture(const int32_t &offset, const int32_t &lx, const int32_t &ly, const int32_t dx1, const int32_t dy1, int32_t O1, const RasterizerVec4 &fP1, const int32_t dx2, const int32_t dy2, int32_t O2, const RasterizerVec4 &fP2, const int32_t dx3, const int32_t dy3, int32_t O3, const RasterizerVec4 &fP3, const RasterizerParams< color_t, color_t, ZBUFFER_t > &data)
TEXTURE + GOURAUD SHADING (NO ZBUFFER)
Definition: Shaders.h:382
void shader_2D_texture(const int32_t &offset, const int32_t &lx, const int32_t &ly, const int32_t dx1, const int32_t dy1, int32_t O1, const RasterizerVec4 &fP1, const int32_t dx2, const int32_t dy2, int32_t O2, const RasterizerVec4 &fP2, const int32_t dx3, const int32_t dy3, int32_t O3, const RasterizerVec4 &fP3, const RasterizerParams< color_t_im, color_t_tex, float > &data)
2D shader (texture)
Definition: Shaders.h:2046
void shader_Flat(const int32_t &offset, const int32_t &lx, const int32_t &ly, const int32_t &dx1, const int32_t &dy1, int32_t O1, const RasterizerVec4 &fP1, const int32_t &dx2, const int32_t &dy2, int32_t O2, const RasterizerVec4 &fP2, const int32_t &dx3, const int32_t &dy3, int32_t O3, const RasterizerVec4 &fP3, const RasterizerParams< color_t, color_t, ZBUFFER_t > &data)
FLAT SHADING (NO ZBUFFER)
Definition: Shaders.h:74
void shader_Flat_Texture(const int32_t &offset, const int32_t &lx, const int32_t &ly, const int32_t dx1, const int32_t dy1, int32_t O1, const RasterizerVec4 &fP1, const int32_t dx2, const int32_t dy2, int32_t O2, const RasterizerVec4 &fP2, const int32_t dx3, const int32_t dy3, int32_t O3, const RasterizerVec4 &fP3, const RasterizerParams< color_t, color_t, ZBUFFER_t > &data)
TEXTURE + FLAT SHADING (NO ZBUFFER)
Definition: Shaders.h:230
void shader_Gouraud(const int32_t &offset, const int32_t &lx, const int32_t &ly, const int32_t &dx1, const int32_t &dy1, int32_t O1, const RasterizerVec4 &fP1, const int32_t &dx2, const int32_t &dy2, int32_t O2, const RasterizerVec4 &fP2, const int32_t &dx3, const int32_t &dy3, int32_t O3, const RasterizerVec4 &fP3, const RasterizerParams< color_t, color_t, ZBUFFER_t > &data)
GOURAUD SHADING (NO Z BUFFER)
Definition: Shaders.h:149
void shader_Flat_Texture_Zbuffer_Ortho(const int32_t &offset, const int32_t &lx, const int32_t &ly, const int32_t dx1, const int32_t dy1, int32_t O1, const RasterizerVec4 &fP1, const int32_t dx2, const int32_t dy2, int32_t O2, const RasterizerVec4 &fP2, const int32_t dx3, const int32_t dy3, int32_t O3, const RasterizerVec4 &fP3, const RasterizerParams< color_t, color_t, ZBUFFER_t > &data)
ZBUFFER + TEXTURE + FLAT SHADING + ORTHOGRAPHIC.
Definition: Shaders.h:1397
void shader_Gouraud_Texture_Ortho(const int32_t &offset, const int32_t &lx, const int32_t &ly, const int32_t dx1, const int32_t dy1, int32_t O1, const RasterizerVec4 &fP1, const int32_t dx2, const int32_t dy2, int32_t O2, const RasterizerVec4 &fP2, const int32_t dx3, const int32_t dy3, int32_t O3, const RasterizerVec4 &fP3, const RasterizerParams< color_t, color_t, ZBUFFER_t > &data)
TEXTURE + GOURAUD SHADING (NO ZBUFFER) + ORTHOGRAPHIC.
Definition: Shaders.h:1243
void shader_Flat_Texture_Zbuffer(const int32_t &offset, const int32_t &lx, const int32_t &ly, const int32_t dx1, const int32_t dy1, int32_t O1, const RasterizerVec4 &fP1, const int32_t dx2, const int32_t dy2, int32_t O2, const RasterizerVec4 &fP2, const int32_t dx3, const int32_t dy3, int32_t O3, const RasterizerVec4 &fP3, const RasterizerParams< color_t, color_t, ZBUFFER_t > &data)
ZBUFFER + TEXTURE + FLAT SHADING.
Definition: Shaders.h:755
void shader_Flat_Texture_Ortho(const int32_t &offset, const int32_t &lx, const int32_t &ly, const int32_t dx1, const int32_t dy1, int32_t O1, const RasterizerVec4 &fP1, const int32_t dx2, const int32_t dy2, int32_t O2, const RasterizerVec4 &fP2, const int32_t dx3, const int32_t dy3, int32_t O3, const RasterizerVec4 &fP3, const RasterizerParams< color_t, color_t, ZBUFFER_t > &data)
TEXTURE + FLAT SHADING (NO ZBUFFER) + ORTHOGRAPHIC.
Definition: Shaders.h:1101
void shader_Gouraud_Texture_Zbuffer_Ortho(const int32_t &offset, const int32_t &lx, const int32_t &ly, const int32_t dx1, const int32_t dy1, int32_t O1, const RasterizerVec4 &fP1, const int32_t dx2, const int32_t dy2, int32_t O2, const RasterizerVec4 &fP2, const int32_t dx3, const int32_t dy3, int32_t O3, const RasterizerVec4 &fP3, const RasterizerParams< color_t, color_t, ZBUFFER_t > &data)
ZBUFFER + TEXTURE + GOURAUD SHADING + ORTHOGRAPHIC.
Definition: Shaders.h:1564
void shader_Gouraud_Zbuffer(const int32_t &offset, const int32_t &lx, const int32_t &ly, const int32_t dx1, const int32_t dy1, int32_t O1, const RasterizerVec4 &fP1, const int32_t dx2, const int32_t dy2, int32_t O2, const RasterizerVec4 &fP2, const int32_t dx3, const int32_t dy3, int32_t O3, const RasterizerVec4 &fP3, const RasterizerParams< color_t, color_t, ZBUFFER_t > &data)
ZBUFFER + GOURAUD SHADING.
Definition: Shaders.h:649
void shader_2D_gradient(const int32_t &offset, const int32_t &lx, const int32_t &ly, const int32_t dx1, const int32_t dy1, int32_t O1, const RasterizerVec4 &fP1, const int32_t dx2, const int32_t dy2, int32_t O2, const RasterizerVec4 &fP2, const int32_t dx3, const int32_t dy3, int32_t O3, const RasterizerVec4 &fP3, const RasterizerParams< color_t_im, color_t_im, float > &data)
2D shader (gradient)
Definition: Shaders.h:1955
TGX_INLINE int shaderclip(int v, int maxv)
for texture clamping
Definition: Shaders.h:34
void shader_Flat_Zbuffer(const int32_t offset, const int32_t &lx, const int32_t &ly, const int32_t &dx1, const int32_t &dy1, int32_t O1, const RasterizerVec4 &fP1, const int32_t &dx2, const int32_t &dy2, int32_t O2, const RasterizerVec4 &fP2, const int32_t &dx3, const int32_t &dy3, int32_t O3, const RasterizerVec4 &fP3, const RasterizerParams< color_t, color_t, ZBUFFER_t > &data)
ZBUFFER + FLAT SHADING.
Definition: Shaders.h:547
void shader_Gouraud_Texture_Zbuffer(const int32_t &offset, const int32_t &lx, const int32_t &ly, const int32_t dx1, const int32_t dy1, int32_t O1, const RasterizerVec4 &fP1, const int32_t dx2, const int32_t dy2, int32_t O2, const RasterizerVec4 &fP2, const int32_t dx3, const int32_t dy3, int32_t O3, const RasterizerVec4 &fP3, const RasterizerParams< color_t, color_t, ZBUFFER_t > &data)
ZBUFFER + TEXTURE + GOURAUD SHADING.
Definition: Shaders.h:923
void shader_2D_texture_blend_op(const int32_t &offset, const int32_t &lx, const int32_t &ly, const int32_t dx1, const int32_t dy1, int32_t O1, const RasterizerVec4 &fP1, const int32_t dx2, const int32_t dy2, int32_t O2, const RasterizerVec4 &fP2, const int32_t dx3, const int32_t dy3, int32_t O3, const RasterizerVec4 &fP3, const RasterizerParams< color_t_im, color_t_tex, float, BLEND_OP > &data)
2D shader (texture with custom blending operator)
Definition: Shaders.h:2244
Color in R8/G8/B8/A8 format.
Definition: Color.h:1176
void mult256(int mr, int mg, int mb)
Multiply each color component by a given factor m/256 with m in [0,256] except the A component.
Definition: Color.h:1590
void blend256(const RGB32 &fg_col, uint32_t alpha)
alpha-blend fg_col over this one with a given opacity in the range 0.0f (fully transparent) to 1....
Definition: Color.h:1561
void blend(const RGB32 &fg_col, float alpha)
alpha-blend fg_col over this one with a given opacity in the range 0.0f (fully transparent) to 1....
Definition: Color.h:1546
float opacity() const
Return the opacity (alpha channel value) of this color in the range [0,1] (0=fully transparent,...
Definition: Color.h:1629
float opacity() const
Dummy function for compatibility with color types having an alpha channel.
Definition: Color.h:565
Color in R16/G16/B16/A16 format.
Definition: Color.h:1791
Color in R,G,B float format.
Definition: Color.h:2407
float R
Red channel.
Definition: Color.h:2420
float B
Blue channel.
Definition: Color.h:2422
float G
Green channel.
Definition: Color.h:2421
T x
'x' coordinate (first dimension)
Definition: Vec2.h:72
T y
'y' coordinate (second dimension)
Definition: Vec2.h:73