1 /*
2     Copyright (c) 2005-2021 Intel Corporation
3 
4     Licensed under the Apache License, Version 2.0 (the "License");
5     you may not use this file except in compliance with the License.
6     You may obtain a copy of the License at
7 
8         http://www.apache.org/licenses/LICENSE-2.0
9 
10     Unless required by applicable law or agreed to in writing, software
11     distributed under the License is distributed on an "AS IS" BASIS,
12     WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13     See the License for the specific language governing permissions and
14     limitations under the License.
15 */
16 
17 /*
18     The original source for this example is
19     Copyright (c) 1994-2008 John E. Stone
20     All rights reserved.
21 
22     Redistribution and use in source and binary forms, with or without
23     modification, are permitted provided that the following conditions
24     are met:
25     1. Redistributions of source code must retain the above copyright
26        notice, this list of conditions and the following disclaimer.
27     2. Redistributions in binary form must reproduce the above copyright
28        notice, this list of conditions and the following disclaimer in the
29        documentation and/or other materials provided with the distribution.
30     3. The name of the author may not be used to endorse or promote products
31        derived from this software without specific prior written permission.
32 
33     THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
34     OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
35     WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
36     ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY
37     DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
38     DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
39     OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
40     HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
41     LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
42     OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
43     SUCH DAMAGE.
44 */
45 
46 #include "machine.hpp"
47 #include "types.hpp"
48 #include "macros.hpp"
49 #include "vector.hpp"
50 #include "tgafile.hpp"
51 #include "trace.hpp"
52 #include "light.hpp"
53 #include "shade.hpp"
54 #include "camera.hpp"
55 #include "util.hpp"
56 #include "intersect.hpp"
57 #include "global.hpp"
58 #include "ui.hpp"
59 #include "tachyon_video.hpp"
60 
61 // shared but read-only so could be private too
62 static thr_parms *all_parms;
63 static scenedef scene;
64 static int startx;
65 static int stopx;
66 static int starty;
67 static int stopy;
68 static flt jitterscale;
69 static int totaly;
70 
71 #include "oneapi/tbb/parallel_for.h"
72 #include "oneapi/tbb/spin_mutex.h"
73 #include "oneapi/tbb/blocked_range.h"
74 #include "oneapi/tbb/global_control.h"
75 #include "common/utility/get_default_num_threads.hpp"
76 
77 static oneapi::tbb::spin_mutex MyMutex, MyMutex2;
78 
render_one_pixel(int x,int y,unsigned int * local_mbox,unsigned int & serial,int startx,int stopx,int starty,int stopy)79 static color_t render_one_pixel(int x,
80                                 int y,
81                                 unsigned int *local_mbox,
82                                 unsigned int &serial,
83                                 int startx,
84                                 int stopx,
85                                 int starty,
86                                 int stopy) {
87     /* private vars moved inside loop */
88     ray primary, sample;
89     color col, avcol;
90     int R, G, B;
91     intersectstruct local_intersections;
92     int alias;
93     /* end private */
94 
95     primary = camray(&scene, x, y);
96     primary.intstruct = &local_intersections;
97     primary.flags = RT_RAY_REGULAR;
98 
99     serial++;
100     primary.serial = serial;
101     primary.mbox = local_mbox;
102     primary.maxdist = FHUGE;
103     primary.scene = &scene;
104     col = trace(&primary);
105 
106     serial = primary.serial;
107 
108     /* perform antialiasing if enabled.. */
109     if (scene.antialiasing > 0) {
110         for (alias = 0; alias < scene.antialiasing; alias++) {
111             serial++; /* increment serial number */
112             sample = primary; /* copy the regular primary ray to start with */
113             sample.serial = serial;
114 
115             {
116                 oneapi::tbb::spin_mutex::scoped_lock lock(MyMutex);
117                 sample.d.x += ((rand() % 100) - 50) / jitterscale;
118                 sample.d.y += ((rand() % 100) - 50) / jitterscale;
119                 sample.d.z += ((rand() % 100) - 50) / jitterscale;
120             }
121 
122             avcol = trace(&sample);
123 
124             serial = sample.serial; /* update our overall serial # */
125 
126             col.r += avcol.r;
127             col.g += avcol.g;
128             col.b += avcol.b;
129         }
130 
131         col.r /= (scene.antialiasing + 1.0);
132         col.g /= (scene.antialiasing + 1.0);
133         col.b /= (scene.antialiasing + 1.0);
134     }
135 
136     /* Handle overexposure and underexposure here... */
137     R = (int)(col.r * 255);
138     if (R > 255)
139         R = 255;
140     else if (R < 0)
141         R = 0;
142 
143     G = (int)(col.g * 255);
144     if (G > 255)
145         G = 255;
146     else if (G < 0)
147         G = 0;
148 
149     B = (int)(col.b * 255);
150     if (B > 255)
151         B = 255;
152     else if (B < 0)
153         B = 0;
154 
155     return video->get_color(R, G, B);
156 }
157 
158 class parallel_task {
159 public:
operator ()(const oneapi::tbb::blocked_range<int> & r) const160     void operator()(const oneapi::tbb::blocked_range<int> &r) const {
161         // task-local storage
162         unsigned int serial = 1;
163         unsigned int mboxsize = sizeof(unsigned int) * (max_objectid() + 20);
164         unsigned int *local_mbox = (unsigned int *)alloca(mboxsize);
165         memset(local_mbox, 0, mboxsize);
166 
167         for (int y = r.begin(); y != r.end(); ++y) {
168             {
169                 drawing_area drawing(startx, totaly - y, stopx - startx, 1);
170                 for (int x = startx; x < stopx; x++) {
171                     color_t c =
172                         render_one_pixel(x, y, local_mbox, serial, startx, stopx, starty, stopy);
173                     drawing.put_pixel(c);
174                 }
175             }
176             if (!video->next_frame())
177                 return;
178         }
179     }
180 
parallel_task()181     parallel_task() {}
182 };
183 
thread_trace(thr_parms * parms)184 void *thread_trace(thr_parms *parms) {
185     int n, nthreads = utility::get_default_num_threads();
186     char *nthreads_str = getenv("TBB_NUM_THREADS");
187     if (nthreads_str && (sscanf(nthreads_str, "%d", &n) > 0) && (n > 0))
188         nthreads = n;
189     oneapi::tbb::global_control c(oneapi::tbb::global_control::max_allowed_parallelism, nthreads);
190 
191     // shared but read-only so could be private too
192     all_parms = parms;
193     scene = parms->scene;
194     startx = parms->startx;
195     stopx = parms->stopx;
196     starty = parms->starty;
197     stopy = parms->stopy;
198     jitterscale = 40.0 * (scene.hres + scene.vres);
199     totaly = parms->scene.vres - 1;
200 
201     int g, grain_size = 1;
202     char *grain_str = getenv("TBB_GRAINSIZE");
203     if (grain_str && (sscanf(grain_str, "%d", &g) > 0) && (g > 0))
204         grain_size = g;
205     char *sched_str = getenv("TBB_PARTITIONER");
206     static oneapi::tbb::affinity_partitioner g_ap;
207     if (sched_str && !strncmp(sched_str, "aff", 3))
208         oneapi::tbb::parallel_for(
209             oneapi::tbb::blocked_range<int>(starty, stopy, grain_size), parallel_task(), g_ap);
210     else if (sched_str && !strncmp(sched_str, "simp", 4))
211         oneapi::tbb::parallel_for(oneapi::tbb::blocked_range<int>(starty, stopy, grain_size),
212                                   parallel_task(),
213                                   oneapi::tbb::simple_partitioner());
214     else
215         oneapi::tbb::parallel_for(oneapi::tbb::blocked_range<int>(starty, stopy, grain_size),
216                                   parallel_task(),
217                                   oneapi::tbb::auto_partitioner());
218 
219     return (nullptr);
220 }
221