1d86ed7fbStbbdev /*
2*b15aabb3Stbbdev     Copyright (c) 2005-2021 Intel Corporation
3d86ed7fbStbbdev 
4d86ed7fbStbbdev     Licensed under the Apache License, Version 2.0 (the "License");
5d86ed7fbStbbdev     you may not use this file except in compliance with the License.
6d86ed7fbStbbdev     You may obtain a copy of the License at
7d86ed7fbStbbdev 
8d86ed7fbStbbdev         http://www.apache.org/licenses/LICENSE-2.0
9d86ed7fbStbbdev 
10d86ed7fbStbbdev     Unless required by applicable law or agreed to in writing, software
11d86ed7fbStbbdev     distributed under the License is distributed on an "AS IS" BASIS,
12d86ed7fbStbbdev     WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13d86ed7fbStbbdev     See the License for the specific language governing permissions and
14d86ed7fbStbbdev     limitations under the License.
15d86ed7fbStbbdev */
16d86ed7fbStbbdev 
17d86ed7fbStbbdev /*
18d86ed7fbStbbdev     The original source for this example is
19d86ed7fbStbbdev     Copyright (c) 1994-2008 John E. Stone
20d86ed7fbStbbdev     All rights reserved.
21d86ed7fbStbbdev 
22d86ed7fbStbbdev     Redistribution and use in source and binary forms, with or without
23d86ed7fbStbbdev     modification, are permitted provided that the following conditions
24d86ed7fbStbbdev     are met:
25d86ed7fbStbbdev     1. Redistributions of source code must retain the above copyright
26d86ed7fbStbbdev        notice, this list of conditions and the following disclaimer.
27d86ed7fbStbbdev     2. Redistributions in binary form must reproduce the above copyright
28d86ed7fbStbbdev        notice, this list of conditions and the following disclaimer in the
29d86ed7fbStbbdev        documentation and/or other materials provided with the distribution.
30d86ed7fbStbbdev     3. The name of the author may not be used to endorse or promote products
31d86ed7fbStbbdev        derived from this software without specific prior written permission.
32d86ed7fbStbbdev 
33d86ed7fbStbbdev     THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
34d86ed7fbStbbdev     OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
35d86ed7fbStbbdev     WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
36d86ed7fbStbbdev     ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY
37d86ed7fbStbbdev     DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
38d86ed7fbStbbdev     DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
39d86ed7fbStbbdev     OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
40d86ed7fbStbbdev     HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
41d86ed7fbStbbdev     LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
42d86ed7fbStbbdev     OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
43d86ed7fbStbbdev     SUCH DAMAGE.
44d86ed7fbStbbdev */
45d86ed7fbStbbdev 
46d86ed7fbStbbdev #include <omp.h>
47d86ed7fbStbbdev #include "machine.hpp"
48d86ed7fbStbbdev #include "types.hpp"
49d86ed7fbStbbdev #include "macros.hpp"
50d86ed7fbStbbdev #include "vector.hpp"
51d86ed7fbStbbdev #include "tgafile.hpp"
52d86ed7fbStbbdev #include "trace.hpp"
53d86ed7fbStbbdev #include "light.hpp"
54d86ed7fbStbbdev #include "shade.hpp"
55d86ed7fbStbbdev #include "camera.hpp"
56d86ed7fbStbbdev #include "util.hpp"
57d86ed7fbStbbdev #include "intersect.hpp"
58d86ed7fbStbbdev #include "global.hpp"
59d86ed7fbStbbdev #include "ui.hpp"
60d86ed7fbStbbdev #include "tachyon_video.hpp"
61d86ed7fbStbbdev 
62d86ed7fbStbbdev // shared but read-only so could be private too
63d86ed7fbStbbdev static thr_parms *all_parms;
64d86ed7fbStbbdev static scenedef scene;
65d86ed7fbStbbdev static int startx;
66d86ed7fbStbbdev static int stopx;
67d86ed7fbStbbdev static int starty;
68d86ed7fbStbbdev static int stopy;
69d86ed7fbStbbdev static flt jitterscale;
70d86ed7fbStbbdev static int totaly;
71d86ed7fbStbbdev 
render_one_pixel(int x,int y,unsigned int * local_mbox,unsigned int & serial,int startx,int stopx,int starty,int stopy)72d86ed7fbStbbdev static color_t render_one_pixel(int x,
73d86ed7fbStbbdev                                 int y,
74d86ed7fbStbbdev                                 unsigned int *local_mbox,
75d86ed7fbStbbdev                                 unsigned int &serial,
76d86ed7fbStbbdev                                 int startx,
77d86ed7fbStbbdev                                 int stopx,
78d86ed7fbStbbdev                                 int starty,
79d86ed7fbStbbdev                                 int stopy) {
80d86ed7fbStbbdev     /* private vars moved inside loop */
81d86ed7fbStbbdev     ray primary, sample;
82d86ed7fbStbbdev     color col, avcol;
83d86ed7fbStbbdev     int R, G, B;
84d86ed7fbStbbdev     intersectstruct local_intersections;
85d86ed7fbStbbdev     int alias;
86d86ed7fbStbbdev     /* end private */
87d86ed7fbStbbdev 
88d86ed7fbStbbdev     primary = camray(&scene, x, y);
89d86ed7fbStbbdev     primary.intstruct = &local_intersections;
90d86ed7fbStbbdev     primary.flags = RT_RAY_REGULAR;
91d86ed7fbStbbdev 
92d86ed7fbStbbdev     serial++;
93d86ed7fbStbbdev     primary.serial = serial;
94d86ed7fbStbbdev     primary.mbox = local_mbox;
95d86ed7fbStbbdev     primary.maxdist = FHUGE;
96d86ed7fbStbbdev     primary.scene = &scene;
97d86ed7fbStbbdev     col = trace(&primary);
98d86ed7fbStbbdev 
99d86ed7fbStbbdev     serial = primary.serial;
100d86ed7fbStbbdev 
101d86ed7fbStbbdev     /* perform antialiasing if enabled.. */
102d86ed7fbStbbdev     if (scene.antialiasing > 0) {
103d86ed7fbStbbdev         for (alias = 0; alias < scene.antialiasing; alias++) {
104d86ed7fbStbbdev             serial++; /* increment serial number */
105d86ed7fbStbbdev             sample = primary; /* copy the regular primary ray to start with */
106d86ed7fbStbbdev             sample.serial = serial;
107d86ed7fbStbbdev 
108d86ed7fbStbbdev #pragma omp critical
109d86ed7fbStbbdev             {
110d86ed7fbStbbdev                 sample.d.x += ((rand() % 100) - 50) / jitterscale;
111d86ed7fbStbbdev                 sample.d.y += ((rand() % 100) - 50) / jitterscale;
112d86ed7fbStbbdev                 sample.d.z += ((rand() % 100) - 50) / jitterscale;
113d86ed7fbStbbdev             }
114d86ed7fbStbbdev 
115d86ed7fbStbbdev             avcol = trace(&sample);
116d86ed7fbStbbdev 
117d86ed7fbStbbdev             serial = sample.serial; /* update our overall serial # */
118d86ed7fbStbbdev 
119d86ed7fbStbbdev             col.r += avcol.r;
120d86ed7fbStbbdev             col.g += avcol.g;
121d86ed7fbStbbdev             col.b += avcol.b;
122d86ed7fbStbbdev         }
123d86ed7fbStbbdev 
124d86ed7fbStbbdev         col.r /= (scene.antialiasing + 1.0);
125d86ed7fbStbbdev         col.g /= (scene.antialiasing + 1.0);
126d86ed7fbStbbdev         col.b /= (scene.antialiasing + 1.0);
127d86ed7fbStbbdev     }
128d86ed7fbStbbdev 
129d86ed7fbStbbdev     /* Handle overexposure and underexposure here... */
130d86ed7fbStbbdev     R = (int)(col.r * 255);
131d86ed7fbStbbdev     if (R > 255)
132d86ed7fbStbbdev         R = 255;
133d86ed7fbStbbdev     else if (R < 0)
134d86ed7fbStbbdev         R = 0;
135d86ed7fbStbbdev 
136d86ed7fbStbbdev     G = (int)(col.g * 255);
137d86ed7fbStbbdev     if (G > 255)
138d86ed7fbStbbdev         G = 255;
139d86ed7fbStbbdev     else if (G < 0)
140d86ed7fbStbbdev         G = 0;
141d86ed7fbStbbdev 
142d86ed7fbStbbdev     B = (int)(col.b * 255);
143d86ed7fbStbbdev     if (B > 255)
144d86ed7fbStbbdev         B = 255;
145d86ed7fbStbbdev     else if (B < 0)
146d86ed7fbStbbdev         B = 0;
147d86ed7fbStbbdev 
148d86ed7fbStbbdev     return video->get_color(R, G, B);
149d86ed7fbStbbdev }
150d86ed7fbStbbdev 
parallel_thread(void)151d86ed7fbStbbdev static void parallel_thread(void) {
152d86ed7fbStbbdev     // thread-local storage
153d86ed7fbStbbdev     unsigned int serial = 1;
154d86ed7fbStbbdev     unsigned int mboxsize = sizeof(unsigned int) * (max_objectid() + 20);
155d86ed7fbStbbdev     unsigned int *local_mbox = (unsigned int *)alloca(mboxsize);
156d86ed7fbStbbdev     memset(local_mbox, 0, mboxsize);
157d86ed7fbStbbdev 
158d86ed7fbStbbdev #pragma omp for nowait schedule(runtime)
159d86ed7fbStbbdev     for (int y = starty; y < stopy; y++) {
160d86ed7fbStbbdev         if (!video->running)
161d86ed7fbStbbdev             continue;
162d86ed7fbStbbdev         drawing_area drawing(startx, totaly - y, stopx - startx, 1);
163d86ed7fbStbbdev         for (int x = startx; x < stopx; x++) {
164d86ed7fbStbbdev             color_t c = render_one_pixel(x, y, local_mbox, serial, startx, stopx, starty, stopy);
165d86ed7fbStbbdev             drawing.put_pixel(c);
166d86ed7fbStbbdev         }
167d86ed7fbStbbdev         video->next_frame();
168d86ed7fbStbbdev     }
169d86ed7fbStbbdev }
170d86ed7fbStbbdev 
thread_trace(thr_parms * parms)171d86ed7fbStbbdev void *thread_trace(thr_parms *parms) {
172d86ed7fbStbbdev     // shared but read-only so could be private too
173d86ed7fbStbbdev     all_parms = parms;
174d86ed7fbStbbdev     scene = parms->scene;
175d86ed7fbStbbdev     startx = parms->startx;
176d86ed7fbStbbdev     stopx = parms->stopx;
177d86ed7fbStbbdev     starty = parms->starty;
178d86ed7fbStbbdev     stopy = parms->stopy;
179d86ed7fbStbbdev     jitterscale = 40.0 * (scene.hres + scene.vres);
180d86ed7fbStbbdev     totaly = parms->scene.vres - 1;
181d86ed7fbStbbdev 
182d86ed7fbStbbdev #pragma omp parallel
183d86ed7fbStbbdev     parallel_thread();
184d86ed7fbStbbdev 
185d86ed7fbStbbdev     return (nullptr);
186d86ed7fbStbbdev }
187