examples/raytrace/render.cc - third_party/tinygltf - Git at Google

 /*
 The MIT License (MIT)

 Copyright (c) 2015 - 2016 Light Transport Entertainment, Inc.

 Permission is hereby granted, free of charge, to any person obtaining a copy
 of this software and associated documentation files (the "Software"), to deal
 in the Software without restriction, including without limitation the rights
 to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 copies of the Software, and to permit persons to whom the Software is
 furnished to do so, subject to the following conditions:

 The above copyright notice and this permission notice shall be included in
 all copies or substantial portions of the Software.

 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 THE SOFTWARE.
 */


 #ifdef _MSC_VER
 #pragma warning(disable : 4018)
 #pragma warning(disable : 4244)
 #pragma warning(disable : 4189)
 #pragma warning(disable : 4996)
 #pragma warning(disable : 4267)
 #pragma warning(disable : 4477)
 #endif

 #include "render.h"

 #include <chrono>  // C++11
 #include <sstream>
 #include <thread>  // C++11
 #include <vector>

 #include <iostream>

 #include "nanort.h"
 #include "matrix.h"
 #include "material.h"
 #include "mesh.h"


 #include "trackball.h"


 #ifdef WIN32
 #undef min
 #undef max
 #endif

 namespace example {

 // PCG32 code / (c) 2014 M.E. O'Neill / pcg-random.org
 // Licensed under Apache License 2.0 (NO WARRANTY, etc. see website)
 // http://www.pcg-random.org/
 typedef struct {
   unsigned long long state;
   unsigned long long inc;  // not used?
 } pcg32_state_t;

 #define PCG32_INITIALIZER \
   { 0x853c49e6748fea9bULL, 0xda3e39cb94b95bdbULL }

 float pcg32_random(pcg32_state_t* rng) {
   unsigned long long oldstate = rng->state;
   rng->state = oldstate * 6364136223846793005ULL + rng->inc;
   unsigned int xorshifted = ((oldstate >> 18u) ^ oldstate) >> 27u;
   unsigned int rot = oldstate >> 59u;
   unsigned int ret = (xorshifted >> rot) | (xorshifted << ((-static_cast<int>(rot)) & 31));

   return (float)((double)ret / (double)4294967296.0);
 }

 void pcg32_srandom(pcg32_state_t* rng, uint64_t initstate, uint64_t initseq) {
   rng->state = 0U;
   rng->inc = (initseq << 1U) | 1U;
   pcg32_random(rng);
   rng->state += initstate;
   pcg32_random(rng);
 }

 const float kPI = 3.141592f;

 typedef nanort::real3<float> float3;

 inline float3 Lerp3(float3 v0, float3 v1, float3 v2, float u, float v) {
   return (1.0f - u - v) * v0 + u * v1 + v * v2;
 }

 inline void CalcNormal(float3& N, float3 v0, float3 v1, float3 v2) {
   float3 v10 = v1 - v0;
   float3 v20 = v2 - v0;

   N = vcross(v20, v10);
   N = vnormalize(N);
 }

 void BuildCameraFrame(float3* origin, float3* corner, float3* u, float3* v,
                       float quat[4], float eye[3], float lookat[3], float up[3],
                       float fov, int width, int height) {
   float e[4][4];

   Matrix::LookAt(e, eye, lookat, up);

   float r[4][4];
   build_rotmatrix(r, quat);

   float3 lo;
   lo[0] = lookat[0] - eye[0];
   lo[1] = lookat[1] - eye[1];
   lo[2] = lookat[2] - eye[2];
   float dist = vlength(lo);

   float dir[3];
   dir[0] = 0.0;
   dir[1] = 0.0;
   dir[2] = dist;

   Matrix::Inverse(r);

   float rr[4][4];
   float re[4][4];
   float zero[3] = {0.0f, 0.0f, 0.0f};
   float localUp[3] = {0.0f, 1.0f, 0.0f};
   Matrix::LookAt(re, dir, zero, localUp);

   // translate
   re[3][0] += eye[0];  // 0.0; //lo[0];
   re[3][1] += eye[1];  // 0.0; //lo[1];
   re[3][2] += (eye[2] - dist);

   // rot -> trans
   Matrix::Mult(rr, r, re);

   float m[4][4];
   for (int j = 0; j < 4; j++) {
     for (int i = 0; i < 4; i++) {
       m[j][i] = rr[j][i];
     }
   }

   float vzero[3] = {0.0f, 0.0f, 0.0f};
   float eye1[3];
   Matrix::MultV(eye1, m, vzero);

   float lookat1d[3];
   dir[2] = -dir[2];
   Matrix::MultV(lookat1d, m, dir);
   float3 lookat1(lookat1d[0], lookat1d[1], lookat1d[2]);

   float up1d[3];
   Matrix::MultV(up1d, m, up);

   float3 up1(up1d[0], up1d[1], up1d[2]);

   // absolute -> relative
   up1[0] -= eye1[0];
   up1[1] -= eye1[1];
   up1[2] -= eye1[2];
   // printf("up1(after) = %f, %f, %f\n", up1[0], up1[1], up1[2]);

   // Use original up vector
   // up1[0] = up[0];
   // up1[1] = up[1];
   // up1[2] = up[2];

   {
     float flen =
         (0.5f * (float)height / tanf(0.5f * (float)(fov * kPI / 180.0f)));
     float3 look1;
     look1[0] = lookat1[0] - eye1[0];
     look1[1] = lookat1[1] - eye1[1];
     look1[2] = lookat1[2] - eye1[2];
     // vcross(u, up1, look1);
     // flip
     (*u) = nanort::vcross(look1, up1);
     (*u) = vnormalize((*u));

     (*v) = vcross(look1, (*u));
     (*v) = vnormalize((*v));

     look1 = vnormalize(look1);
     look1[0] = flen * look1[0] + eye1[0];
     look1[1] = flen * look1[1] + eye1[1];
     look1[2] = flen * look1[2] + eye1[2];
     (*corner)[0] = look1[0] - 0.5f * (width * (*u)[0] + height * (*v)[0]);
     (*corner)[1] = look1[1] - 0.5f * (width * (*u)[1] + height * (*v)[1]);
     (*corner)[2] = look1[2] - 0.5f * (width * (*u)[2] + height * (*v)[2]);

     (*origin)[0] = eye1[0];
     (*origin)[1] = eye1[1];
     (*origin)[2] = eye1[2];
   }
 }

 #if 0 // TODO(LTE): Not used method. Delete.
 nanort::Ray<float> GenerateRay(const float3& origin, const float3& corner,
                                const float3& du, const float3& dv, float u,
                                float v) {
   float3 dir;

   dir[0] = (corner[0] + u * du[0] + v * dv[0]) - origin[0];
   dir[1] = (corner[1] + u * du[1] + v * dv[1]) - origin[1];
   dir[2] = (corner[2] + u * du[2] + v * dv[2]) - origin[2];
   dir = vnormalize(dir);

   float3 org;

   nanort::Ray<float> ray;
   ray.org[0] = origin[0];
   ray.org[1] = origin[1];
   ray.org[2] = origin[2];
   ray.dir[0] = dir[0];
   ray.dir[1] = dir[1];
   ray.dir[2] = dir[2];

   return ray;
 }
 #endif

 void FetchTexture(const Texture &texture, float u, float v, float* col) {
   int tx = u * texture.width;
   int ty = (1.0f - v) * texture.height;
   int idx_offset = (ty * texture.width + tx) * texture.components;
   col[0] = texture.image[idx_offset + 0] / 255.f;
   col[1] = texture.image[idx_offset + 1] / 255.f;
   col[2] = texture.image[idx_offset + 2] / 255.f;
 }

 bool Renderer::Render(float* rgba, float* aux_rgba, int* sample_counts,
                       float quat[4],
                       const nanosg::Scene<float, example::Mesh<float>> &scene,
                       const example::Asset &asset,
                       const RenderConfig& config,
                       std::atomic<bool>& cancelFlag,
                       int &_showBufferMode
                       ) {
   //if (!gAccel.IsValid()) {
   //  return false;
   //}


   int width = config.width;
   int height = config.height;

   // camera
   float eye[3] = {config.eye[0], config.eye[1], config.eye[2]};
   float look_at[3] = {config.look_at[0], config.look_at[1], config.look_at[2]};
   float up[3] = {config.up[0], config.up[1], config.up[2]};
   float fov = config.fov;
   float3 origin, corner, u, v;
   BuildCameraFrame(&origin, &corner, &u, &v, quat, eye, look_at, up, fov, width,
                    height);

   auto kCancelFlagCheckMilliSeconds = 300;

   std::vector<std::thread> workers;
   std::atomic<int> i(0);

   uint32_t num_threads = std::max(1U, std::thread::hardware_concurrency());

   auto startT = std::chrono::system_clock::now();

   // Initialize RNG.

   for (auto t = 0; t < num_threads; t++) {
     workers.emplace_back(std::thread([&, t]() {
       pcg32_state_t rng;
       pcg32_srandom(&rng, config.pass,
                     t);  // seed = combination of render pass + thread no.

       int y = 0;
       while ((y = i++) < config.height) {
         auto currT = std::chrono::system_clock::now();

         std::chrono::duration<double, std::milli> ms = currT - startT;
         // Check cancel flag
         if (ms.count() > kCancelFlagCheckMilliSeconds) {
           if (cancelFlag) {
             break;
           }
         }

         // draw dash line to aux buffer for progress.
         // for (int x = 0; x < config.width; x++) {
         //  float c = (x / 8) % 2;
         //  aux_rgba[4*(y*config.width+x)+0] = c;
         //  aux_rgba[4*(y*config.width+x)+1] = c;
         //  aux_rgba[4*(y*config.width+x)+2] = c;
         //  aux_rgba[4*(y*config.width+x)+3] = 0.0f;
         //}

         for (int x = 0; x < config.width; x++) {
           nanort::Ray<float> ray;
           ray.org[0] = origin[0];
           ray.org[1] = origin[1];
           ray.org[2] = origin[2];

           float u0 = pcg32_random(&rng);
           float u1 = pcg32_random(&rng);

           float3 dir;

         //for modes not a "color"
 		    if(_showBufferMode != SHOW_BUFFER_COLOR)
 		    {
           //only one pass
 			    if(config.pass > 0)
 				    continue;

           //to the center of pixel
 			      u0 = 0.5f;
 			      u1 = 0.5f;
 		      }

           dir = corner + (float(x) + u0) * u +
                 (float(config.height - y - 1) + u1) * v;
           dir = vnormalize(dir);
           ray.dir[0] = dir[0];
           ray.dir[1] = dir[1];
           ray.dir[2] = dir[2];

           float kFar = 1.0e+30f;
           ray.min_t = 0.0f;
           ray.max_t = kFar;


           nanosg::Intersection<float> isect;
           bool hit = scene.Traverse(ray, &isect, /* cull_back_face */false);

           if (hit) {

             const std::vector<Material> &materials = asset.materials;
             const std::vector<Texture> &textures = asset.textures;
             const Mesh<float> &mesh = asset.meshes[isect.node_id];

 			//tigra: add default material
 			const Material &default_material = asset.default_material;

             float3 p;
             p[0] =
                 ray.org[0] + isect.t * ray.dir[0];
             p[1] =
                 ray.org[1] + isect.t * ray.dir[1];
             p[2] =
                 ray.org[2] + isect.t * ray.dir[2];

             config.positionImage[4 * (y * config.width + x) + 0] = p.x();
             config.positionImage[4 * (y * config.width + x) + 1] = p.y();
             config.positionImage[4 * (y * config.width + x) + 2] = p.z();
             config.positionImage[4 * (y * config.width + x) + 3] = 1.0f;

             config.varycoordImage[4 * (y * config.width + x) + 0] =
                 isect.u;
             config.varycoordImage[4 * (y * config.width + x) + 1] =
                 isect.v;
             config.varycoordImage[4 * (y * config.width + x) + 2] = 0.0f;
             config.varycoordImage[4 * (y * config.width + x) + 3] = 1.0f;

             unsigned int prim_id = isect.prim_id;

             float3 N;
             if (mesh.facevarying_normals.size() > 0) {
               float3 n0, n1, n2;
               n0[0] = mesh.facevarying_normals[9 * prim_id + 0];
               n0[1] = mesh.facevarying_normals[9 * prim_id + 1];
               n0[2] = mesh.facevarying_normals[9 * prim_id + 2];
               n1[0] = mesh.facevarying_normals[9 * prim_id + 3];
               n1[1] = mesh.facevarying_normals[9 * prim_id + 4];
               n1[2] = mesh.facevarying_normals[9 * prim_id + 5];
               n2[0] = mesh.facevarying_normals[9 * prim_id + 6];
               n2[1] = mesh.facevarying_normals[9 * prim_id + 7];
               n2[2] = mesh.facevarying_normals[9 * prim_id + 8];
               N = Lerp3(n0, n1, n2, isect.u, isect.v);
             } else {
               unsigned int f0, f1, f2;
               f0 = mesh.faces[3 * prim_id + 0];
               f1 = mesh.faces[3 * prim_id + 1];
               f2 = mesh.faces[3 * prim_id + 2];

               float3 v0, v1, v2;
               v0[0] = mesh.vertices[3 * f0 + 0];
               v0[1] = mesh.vertices[3 * f0 + 1];
               v0[2] = mesh.vertices[3 * f0 + 2];
               v1[0] = mesh.vertices[3 * f1 + 0];
               v1[1] = mesh.vertices[3 * f1 + 1];
               v1[2] = mesh.vertices[3 * f1 + 2];
               v2[0] = mesh.vertices[3 * f2 + 0];
               v2[1] = mesh.vertices[3 * f2 + 1];
               v2[2] = mesh.vertices[3 * f2 + 2];
               CalcNormal(N, v0, v1, v2);
             }

             config.normalImage[4 * (y * config.width + x) + 0] =
                 0.5f * N[0] + 0.5f;
             config.normalImage[4 * (y * config.width + x) + 1] =
                 0.5f * N[1] + 0.5f;
             config.normalImage[4 * (y * config.width + x) + 2] =
                 0.5f * N[2] + 0.5f;
             config.normalImage[4 * (y * config.width + x) + 3] = 1.0f;

             config.depthImage[4 * (y * config.width + x) + 0] =
                 isect.t;
             config.depthImage[4 * (y * config.width + x) + 1] =
                 isect.t;
             config.depthImage[4 * (y * config.width + x) + 2] =
                 isect.t;
             config.depthImage[4 * (y * config.width + x) + 3] = 1.0f;

             float3 UV;
             if (mesh.facevarying_uvs.size() > 0) {
               float3 uv0, uv1, uv2;
               uv0[0] = mesh.facevarying_uvs[6 * prim_id + 0];
               uv0[1] = mesh.facevarying_uvs[6 * prim_id + 1];
               uv1[0] = mesh.facevarying_uvs[6 * prim_id + 2];
               uv1[1] = mesh.facevarying_uvs[6 * prim_id + 3];
               uv2[0] = mesh.facevarying_uvs[6 * prim_id + 4];
               uv2[1] = mesh.facevarying_uvs[6 * prim_id + 5];

               UV = Lerp3(uv0, uv1, uv2, isect.u, isect.v);

               config.texcoordImage[4 * (y * config.width + x) + 0] = UV[0];
               config.texcoordImage[4 * (y * config.width + x) + 1] = UV[1];
             }

             // Fetch texture
             unsigned int material_id =
                 mesh.material_ids[isect.prim_id];

 			//printf("material_id=%d materials=%lld\n", material_id, materials.size());

             float diffuse_col[3];

             float specular_col[3];

 			//tigra: material_id is ok
 			if(material_id<materials.size())
 			{
 				//printf("ok mat\n");

 				int diffuse_texid = materials[material_id].diffuse_texid;
 				if (diffuse_texid >= 0) {
 				  FetchTexture(textures[diffuse_texid], UV[0], UV[1], diffuse_col);
 				} else {
 				  diffuse_col[0] = materials[material_id].diffuse[0];
 				  diffuse_col[1] = materials[material_id].diffuse[1];
 				  diffuse_col[2] = materials[material_id].diffuse[2];
 				}

 				int specular_texid = materials[material_id].specular_texid;
 				if (specular_texid >= 0) {
 				  FetchTexture(textures[specular_texid], UV[0], UV[1], specular_col);
 				} else {
 				  specular_col[0] = materials[material_id].specular[0];
 				  specular_col[1] = materials[material_id].specular[1];
 				  specular_col[2] = materials[material_id].specular[2];
 				}
 			}
 			else
 				//tigra: wrong material_id, use default_material
 				{

 				//printf("default_material\n");

 					diffuse_col[0] = default_material.diffuse[0];
 					diffuse_col[1] = default_material.diffuse[1];
 					diffuse_col[2] = default_material.diffuse[2];
 					specular_col[0] = default_material.specular[0];
 					specular_col[1] = default_material.specular[1];
 					specular_col[2] = default_material.specular[2];
 				}

             // Simple shading
             float NdotV = fabsf(vdot(N, dir));

             if (config.pass == 0) {
               rgba[4 * (y * config.width + x) + 0] = NdotV * diffuse_col[0];
               rgba[4 * (y * config.width + x) + 1] = NdotV * diffuse_col[1];
               rgba[4 * (y * config.width + x) + 2] = NdotV * diffuse_col[2];
               rgba[4 * (y * config.width + x) + 3] = 1.0f;
               sample_counts[y * config.width + x] =
                   1;  // Set 1 for the first pass
             } else {  // additive.
               rgba[4 * (y * config.width + x) + 0] += NdotV * diffuse_col[0];
               rgba[4 * (y * config.width + x) + 1] += NdotV * diffuse_col[1];
               rgba[4 * (y * config.width + x) + 2] += NdotV * diffuse_col[2];
               rgba[4 * (y * config.width + x) + 3] += 1.0f;
               sample_counts[y * config.width + x]++;
             }

           } else {
             {
               if (config.pass == 0) {
                 // clear pixel
                 rgba[4 * (y * config.width + x) + 0] = 0.0f;
                 rgba[4 * (y * config.width + x) + 1] = 0.0f;
                 rgba[4 * (y * config.width + x) + 2] = 0.0f;
                 rgba[4 * (y * config.width + x) + 3] = 0.0f;
                 aux_rgba[4 * (y * config.width + x) + 0] = 0.0f;
                 aux_rgba[4 * (y * config.width + x) + 1] = 0.0f;
                 aux_rgba[4 * (y * config.width + x) + 2] = 0.0f;
                 aux_rgba[4 * (y * config.width + x) + 3] = 0.0f;
                 sample_counts[y * config.width + x] =
                     1;  // Set 1 for the first pass
               } else {
                 sample_counts[y * config.width + x]++;
               }

               // No super sampling
               config.normalImage[4 * (y * config.width + x) + 0] = 0.0f;
               config.normalImage[4 * (y * config.width + x) + 1] = 0.0f;
               config.normalImage[4 * (y * config.width + x) + 2] = 0.0f;
               config.normalImage[4 * (y * config.width + x) + 3] = 0.0f;
               config.positionImage[4 * (y * config.width + x) + 0] = 0.0f;
               config.positionImage[4 * (y * config.width + x) + 1] = 0.0f;
               config.positionImage[4 * (y * config.width + x) + 2] = 0.0f;
               config.positionImage[4 * (y * config.width + x) + 3] = 0.0f;
               config.depthImage[4 * (y * config.width + x) + 0] = 0.0f;
               config.depthImage[4 * (y * config.width + x) + 1] = 0.0f;
               config.depthImage[4 * (y * config.width + x) + 2] = 0.0f;
               config.depthImage[4 * (y * config.width + x) + 3] = 0.0f;
               config.texcoordImage[4 * (y * config.width + x) + 0] = 0.0f;
               config.texcoordImage[4 * (y * config.width + x) + 1] = 0.0f;
               config.texcoordImage[4 * (y * config.width + x) + 2] = 0.0f;
               config.texcoordImage[4 * (y * config.width + x) + 3] = 0.0f;
               config.varycoordImage[4 * (y * config.width + x) + 0] = 0.0f;
               config.varycoordImage[4 * (y * config.width + x) + 1] = 0.0f;
               config.varycoordImage[4 * (y * config.width + x) + 2] = 0.0f;
               config.varycoordImage[4 * (y * config.width + x) + 3] = 0.0f;
             }
           }
         }

         for (int x = 0; x < config.width; x++) {
           aux_rgba[4 * (y * config.width + x) + 0] = 0.0f;
           aux_rgba[4 * (y * config.width + x) + 1] = 0.0f;
           aux_rgba[4 * (y * config.width + x) + 2] = 0.0f;
           aux_rgba[4 * (y * config.width + x) + 3] = 0.0f;
         }
       }
     }));
   }

   for (auto& t : workers) {
     t.join();
   }

   return (!cancelFlag);
 };

 }  // namespace example
	/*
	The MIT License (MIT)

	Copyright (c) 2015 - 2016 Light Transport Entertainment, Inc.

	Permission is hereby granted, free of charge, to any person obtaining a copy
	of this software and associated documentation files (the "Software"), to deal
	in the Software without restriction, including without limitation the rights
	to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
	copies of the Software, and to permit persons to whom the Software is
	furnished to do so, subject to the following conditions:

	The above copyright notice and this permission notice shall be included in
	all copies or substantial portions of the Software.

	THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
	IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
	FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
	AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
	LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
	OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
	THE SOFTWARE.
	*/


	#ifdef _MSC_VER
	#pragma warning(disable : 4018)
	#pragma warning(disable : 4244)
	#pragma warning(disable : 4189)
	#pragma warning(disable : 4996)
	#pragma warning(disable : 4267)
	#pragma warning(disable : 4477)
	#endif

	#include "render.h"

	#include <chrono> // C++11
	#include <sstream>
	#include <thread> // C++11
	#include <vector>

	#include <iostream>

	#include "nanort.h"
	#include "matrix.h"
	#include "material.h"
	#include "mesh.h"


	#include "trackball.h"


	#ifdef WIN32
	#undef min
	#undef max
	#endif

	namespace example {

	// PCG32 code / (c) 2014 M.E. O'Neill / pcg-random.org
	// Licensed under Apache License 2.0 (NO WARRANTY, etc. see website)
	// http://www.pcg-random.org/
	typedef struct {
	unsigned long long state;
	unsigned long long inc; // not used?
	} pcg32_state_t;

	#define PCG32_INITIALIZER \
	{ 0x853c49e6748fea9bULL, 0xda3e39cb94b95bdbULL }

	float pcg32_random(pcg32_state_t* rng) {
	unsigned long long oldstate = rng->state;
	rng->state = oldstate * 6364136223846793005ULL + rng->inc;
	unsigned int xorshifted = ((oldstate >> 18u) ^ oldstate) >> 27u;
	unsigned int rot = oldstate >> 59u;
	unsigned int ret = (xorshifted >> rot) \| (xorshifted << ((-static_cast<int>(rot)) & 31));

	return (float)((double)ret / (double)4294967296.0);
	}

	void pcg32_srandom(pcg32_state_t* rng, uint64_t initstate, uint64_t initseq) {
	rng->state = 0U;
	rng->inc = (initseq << 1U) \| 1U;
	pcg32_random(rng);
	rng->state += initstate;
	pcg32_random(rng);
	}

	const float kPI = 3.141592f;

	typedef nanort::real3<float> float3;

	inline float3 Lerp3(float3 v0, float3 v1, float3 v2, float u, float v) {
	return (1.0f - u - v) * v0 + u * v1 + v * v2;
	}

	inline void CalcNormal(float3& N, float3 v0, float3 v1, float3 v2) {
	float3 v10 = v1 - v0;
	float3 v20 = v2 - v0;

	N = vcross(v20, v10);
	N = vnormalize(N);
	}

	void BuildCameraFrame(float3* origin, float3* corner, float3* u, float3* v,
	float quat[4], float eye[3], float lookat[3], float up[3],
	float fov, int width, int height) {
	float e[4][4];

	Matrix::LookAt(e, eye, lookat, up);

	float r[4][4];
	build_rotmatrix(r, quat);

	float3 lo;
	lo[0] = lookat[0] - eye[0];
	lo[1] = lookat[1] - eye[1];
	lo[2] = lookat[2] - eye[2];
	float dist = vlength(lo);

	float dir[3];
	dir[0] = 0.0;
	dir[1] = 0.0;
	dir[2] = dist;

	Matrix::Inverse(r);

	float rr[4][4];
	float re[4][4];
	float zero[3] = {0.0f, 0.0f, 0.0f};
	float localUp[3] = {0.0f, 1.0f, 0.0f};
	Matrix::LookAt(re, dir, zero, localUp);

	// translate
	re[3][0] += eye[0]; // 0.0; //lo[0];
	re[3][1] += eye[1]; // 0.0; //lo[1];
	re[3][2] += (eye[2] - dist);

	// rot -> trans
	Matrix::Mult(rr, r, re);

	float m[4][4];
	for (int j = 0; j < 4; j++) {
	for (int i = 0; i < 4; i++) {
	m[j][i] = rr[j][i];
	}
	}

	float vzero[3] = {0.0f, 0.0f, 0.0f};
	float eye1[3];
	Matrix::MultV(eye1, m, vzero);

	float lookat1d[3];
	dir[2] = -dir[2];
	Matrix::MultV(lookat1d, m, dir);
	float3 lookat1(lookat1d[0], lookat1d[1], lookat1d[2]);

	float up1d[3];
	Matrix::MultV(up1d, m, up);

	float3 up1(up1d[0], up1d[1], up1d[2]);

	// absolute -> relative
	up1[0] -= eye1[0];
	up1[1] -= eye1[1];
	up1[2] -= eye1[2];
	// printf("up1(after) = %f, %f, %f\n", up1[0], up1[1], up1[2]);

	// Use original up vector
	// up1[0] = up[0];
	// up1[1] = up[1];
	// up1[2] = up[2];

	{
	float flen =
	(0.5f * (float)height / tanf(0.5f * (float)(fov * kPI / 180.0f)));
	float3 look1;
	look1[0] = lookat1[0] - eye1[0];
	look1[1] = lookat1[1] - eye1[1];
	look1[2] = lookat1[2] - eye1[2];
	// vcross(u, up1, look1);
	// flip
	(*u) = nanort::vcross(look1, up1);
	(u) = vnormalize((u));

	(v) = vcross(look1, (u));
	(v) = vnormalize((v));

	look1 = vnormalize(look1);
	look1[0] = flen * look1[0] + eye1[0];
	look1[1] = flen * look1[1] + eye1[1];
	look1[2] = flen * look1[2] + eye1[2];
	(corner)[0] = look1[0] - 0.5f (width * (u)[0] + height (*v)[0]);
	(corner)[1] = look1[1] - 0.5f (width * (u)[1] + height (*v)[1]);
	(corner)[2] = look1[2] - 0.5f (width * (u)[2] + height (*v)[2]);

	(*origin)[0] = eye1[0];
	(*origin)[1] = eye1[1];
	(*origin)[2] = eye1[2];
	}
	}

	#if 0 // TODO(LTE): Not used method. Delete.
	nanort::Ray<float> GenerateRay(const float3& origin, const float3& corner,
	const float3& du, const float3& dv, float u,
	float v) {
	float3 dir;

	dir[0] = (corner[0] + u * du[0] + v * dv[0]) - origin[0];
	dir[1] = (corner[1] + u * du[1] + v * dv[1]) - origin[1];
	dir[2] = (corner[2] + u * du[2] + v * dv[2]) - origin[2];
	dir = vnormalize(dir);

	float3 org;

	nanort::Ray<float> ray;
	ray.org[0] = origin[0];
	ray.org[1] = origin[1];
	ray.org[2] = origin[2];
	ray.dir[0] = dir[0];
	ray.dir[1] = dir[1];
	ray.dir[2] = dir[2];

	return ray;
	}
	#endif

	void FetchTexture(const Texture &texture, float u, float v, float* col) {
	int tx = u * texture.width;
	int ty = (1.0f - v) * texture.height;
	int idx_offset = (ty * texture.width + tx) * texture.components;
	col[0] = texture.image[idx_offset + 0] / 255.f;
	col[1] = texture.image[idx_offset + 1] / 255.f;
	col[2] = texture.image[idx_offset + 2] / 255.f;
	}

	bool Renderer::Render(float* rgba, float* aux_rgba, int* sample_counts,
	float quat[4],
	const nanosg::Scene<float, example::Mesh<float>> &scene,
	const example::Asset &asset,
	const RenderConfig& config,
	std::atomic<bool>& cancelFlag,
	int &_showBufferMode
	) {
	//if (!gAccel.IsValid()) {
	// return false;
	//}




	int width = config.width;
	int height = config.height;

	// camera
	float eye[3] = {config.eye[0], config.eye[1], config.eye[2]};
	float look_at[3] = {config.look_at[0], config.look_at[1], config.look_at[2]};
	float up[3] = {config.up[0], config.up[1], config.up[2]};
	float fov = config.fov;
	float3 origin, corner, u, v;
	BuildCameraFrame(&origin, &corner, &u, &v, quat, eye, look_at, up, fov, width,
	height);

	auto kCancelFlagCheckMilliSeconds = 300;

	std::vector<std::thread> workers;
	std::atomic<int> i(0);

	uint32_t num_threads = std::max(1U, std::thread::hardware_concurrency());

	auto startT = std::chrono::system_clock::now();

	// Initialize RNG.

	for (auto t = 0; t < num_threads; t++) {
	workers.emplace_back(std::thread([&, t]() {
	pcg32_state_t rng;
	pcg32_srandom(&rng, config.pass,
	t); // seed = combination of render pass + thread no.

	int y = 0;
	while ((y = i++) < config.height) {
	auto currT = std::chrono::system_clock::now();

	std::chrono::duration<double, std::milli> ms = currT - startT;
	// Check cancel flag
	if (ms.count() > kCancelFlagCheckMilliSeconds) {
	if (cancelFlag) {
	break;
	}
	}

	// draw dash line to aux buffer for progress.
	// for (int x = 0; x < config.width; x++) {
	// float c = (x / 8) % 2;
	// aux_rgba[4(yconfig.width+x)+0] = c;
	// aux_rgba[4(yconfig.width+x)+1] = c;
	// aux_rgba[4(yconfig.width+x)+2] = c;
	// aux_rgba[4(yconfig.width+x)+3] = 0.0f;
	//}

	for (int x = 0; x < config.width; x++) {
	nanort::Ray<float> ray;
	ray.org[0] = origin[0];
	ray.org[1] = origin[1];
	ray.org[2] = origin[2];

	float u0 = pcg32_random(&rng);
	float u1 = pcg32_random(&rng);

	float3 dir;

	//for modes not a "color"
	if(_showBufferMode != SHOW_BUFFER_COLOR)
	{
	//only one pass
	if(config.pass > 0)
	continue;

	//to the center of pixel
	u0 = 0.5f;
	u1 = 0.5f;
	}

	dir = corner + (float(x) + u0) * u +
	(float(config.height - y - 1) + u1) * v;
	dir = vnormalize(dir);
	ray.dir[0] = dir[0];
	ray.dir[1] = dir[1];
	ray.dir[2] = dir[2];

	float kFar = 1.0e+30f;
	ray.min_t = 0.0f;
	ray.max_t = kFar;


	nanosg::Intersection<float> isect;
	bool hit = scene.Traverse(ray, &isect, /* cull_back_face */false);

	if (hit) {

	const std::vector<Material> &materials = asset.materials;
	const std::vector<Texture> &textures = asset.textures;
	const Mesh<float> &mesh = asset.meshes[isect.node_id];

	//tigra: add default material
	const Material &default_material = asset.default_material;

	float3 p;
	p[0] =
	ray.org[0] + isect.t * ray.dir[0];
	p[1] =
	ray.org[1] + isect.t * ray.dir[1];
	p[2] =
	ray.org[2] + isect.t * ray.dir[2];

	config.positionImage[4 * (y * config.width + x) + 0] = p.x();
	config.positionImage[4 * (y * config.width + x) + 1] = p.y();
	config.positionImage[4 * (y * config.width + x) + 2] = p.z();
	config.positionImage[4 * (y * config.width + x) + 3] = 1.0f;

	config.varycoordImage[4 * (y * config.width + x) + 0] =
	isect.u;
	config.varycoordImage[4 * (y * config.width + x) + 1] =
	isect.v;
	config.varycoordImage[4 * (y * config.width + x) + 2] = 0.0f;
	config.varycoordImage[4 * (y * config.width + x) + 3] = 1.0f;

	unsigned int prim_id = isect.prim_id;

	float3 N;
	if (mesh.facevarying_normals.size() > 0) {
	float3 n0, n1, n2;
	n0[0] = mesh.facevarying_normals[9 * prim_id + 0];
	n0[1] = mesh.facevarying_normals[9 * prim_id + 1];
	n0[2] = mesh.facevarying_normals[9 * prim_id + 2];
	n1[0] = mesh.facevarying_normals[9 * prim_id + 3];
	n1[1] = mesh.facevarying_normals[9 * prim_id + 4];
	n1[2] = mesh.facevarying_normals[9 * prim_id + 5];
	n2[0] = mesh.facevarying_normals[9 * prim_id + 6];
	n2[1] = mesh.facevarying_normals[9 * prim_id + 7];
	n2[2] = mesh.facevarying_normals[9 * prim_id + 8];
	N = Lerp3(n0, n1, n2, isect.u, isect.v);
	} else {
	unsigned int f0, f1, f2;
	f0 = mesh.faces[3 * prim_id + 0];
	f1 = mesh.faces[3 * prim_id + 1];
	f2 = mesh.faces[3 * prim_id + 2];

	float3 v0, v1, v2;
	v0[0] = mesh.vertices[3 * f0 + 0];
	v0[1] = mesh.vertices[3 * f0 + 1];
	v0[2] = mesh.vertices[3 * f0 + 2];
	v1[0] = mesh.vertices[3 * f1 + 0];
	v1[1] = mesh.vertices[3 * f1 + 1];
	v1[2] = mesh.vertices[3 * f1 + 2];
	v2[0] = mesh.vertices[3 * f2 + 0];
	v2[1] = mesh.vertices[3 * f2 + 1];
	v2[2] = mesh.vertices[3 * f2 + 2];
	CalcNormal(N, v0, v1, v2);
	}

	config.normalImage[4 * (y * config.width + x) + 0] =
	0.5f * N[0] + 0.5f;
	config.normalImage[4 * (y * config.width + x) + 1] =
	0.5f * N[1] + 0.5f;
	config.normalImage[4 * (y * config.width + x) + 2] =
	0.5f * N[2] + 0.5f;
	config.normalImage[4 * (y * config.width + x) + 3] = 1.0f;

	config.depthImage[4 * (y * config.width + x) + 0] =
	isect.t;
	config.depthImage[4 * (y * config.width + x) + 1] =
	isect.t;
	config.depthImage[4 * (y * config.width + x) + 2] =
	isect.t;
	config.depthImage[4 * (y * config.width + x) + 3] = 1.0f;

	float3 UV;
	if (mesh.facevarying_uvs.size() > 0) {
	float3 uv0, uv1, uv2;
	uv0[0] = mesh.facevarying_uvs[6 * prim_id + 0];
	uv0[1] = mesh.facevarying_uvs[6 * prim_id + 1];
	uv1[0] = mesh.facevarying_uvs[6 * prim_id + 2];
	uv1[1] = mesh.facevarying_uvs[6 * prim_id + 3];
	uv2[0] = mesh.facevarying_uvs[6 * prim_id + 4];
	uv2[1] = mesh.facevarying_uvs[6 * prim_id + 5];

	UV = Lerp3(uv0, uv1, uv2, isect.u, isect.v);

	config.texcoordImage[4 * (y * config.width + x) + 0] = UV[0];
	config.texcoordImage[4 * (y * config.width + x) + 1] = UV[1];
	}

	// Fetch texture
	unsigned int material_id =
	mesh.material_ids[isect.prim_id];

	//printf("material_id=%d materials=%lld\n", material_id, materials.size());

	float diffuse_col[3];

	float specular_col[3];

	//tigra: material_id is ok
	if(material_id<materials.size())
	{
	//printf("ok mat\n");

	int diffuse_texid = materials[material_id].diffuse_texid;
	if (diffuse_texid >= 0) {
	FetchTexture(textures[diffuse_texid], UV[0], UV[1], diffuse_col);
	} else {
	diffuse_col[0] = materials[material_id].diffuse[0];
	diffuse_col[1] = materials[material_id].diffuse[1];
	diffuse_col[2] = materials[material_id].diffuse[2];
	}

	int specular_texid = materials[material_id].specular_texid;
	if (specular_texid >= 0) {
	FetchTexture(textures[specular_texid], UV[0], UV[1], specular_col);
	} else {
	specular_col[0] = materials[material_id].specular[0];
	specular_col[1] = materials[material_id].specular[1];
	specular_col[2] = materials[material_id].specular[2];
	}
	}
	else
	//tigra: wrong material_id, use default_material
	{

	//printf("default_material\n");

	diffuse_col[0] = default_material.diffuse[0];
	diffuse_col[1] = default_material.diffuse[1];
	diffuse_col[2] = default_material.diffuse[2];
	specular_col[0] = default_material.specular[0];
	specular_col[1] = default_material.specular[1];
	specular_col[2] = default_material.specular[2];
	}

	// Simple shading
	float NdotV = fabsf(vdot(N, dir));

	if (config.pass == 0) {
	rgba[4 * (y * config.width + x) + 0] = NdotV * diffuse_col[0];
	rgba[4 * (y * config.width + x) + 1] = NdotV * diffuse_col[1];
	rgba[4 * (y * config.width + x) + 2] = NdotV * diffuse_col[2];
	rgba[4 * (y * config.width + x) + 3] = 1.0f;
	sample_counts[y * config.width + x] =
	1; // Set 1 for the first pass
	} else { // additive.
	rgba[4 * (y * config.width + x) + 0] += NdotV * diffuse_col[0];
	rgba[4 * (y * config.width + x) + 1] += NdotV * diffuse_col[1];
	rgba[4 * (y * config.width + x) + 2] += NdotV * diffuse_col[2];
	rgba[4 * (y * config.width + x) + 3] += 1.0f;
	sample_counts[y * config.width + x]++;
	}

	} else {
	{
	if (config.pass == 0) {
	// clear pixel
	rgba[4 * (y * config.width + x) + 0] = 0.0f;
	rgba[4 * (y * config.width + x) + 1] = 0.0f;
	rgba[4 * (y * config.width + x) + 2] = 0.0f;
	rgba[4 * (y * config.width + x) + 3] = 0.0f;
	aux_rgba[4 * (y * config.width + x) + 0] = 0.0f;
	aux_rgba[4 * (y * config.width + x) + 1] = 0.0f;
	aux_rgba[4 * (y * config.width + x) + 2] = 0.0f;
	aux_rgba[4 * (y * config.width + x) + 3] = 0.0f;
	sample_counts[y * config.width + x] =
	1; // Set 1 for the first pass
	} else {
	sample_counts[y * config.width + x]++;
	}

	// No super sampling
	config.normalImage[4 * (y * config.width + x) + 0] = 0.0f;
	config.normalImage[4 * (y * config.width + x) + 1] = 0.0f;
	config.normalImage[4 * (y * config.width + x) + 2] = 0.0f;
	config.normalImage[4 * (y * config.width + x) + 3] = 0.0f;
	config.positionImage[4 * (y * config.width + x) + 0] = 0.0f;
	config.positionImage[4 * (y * config.width + x) + 1] = 0.0f;
	config.positionImage[4 * (y * config.width + x) + 2] = 0.0f;
	config.positionImage[4 * (y * config.width + x) + 3] = 0.0f;
	config.depthImage[4 * (y * config.width + x) + 0] = 0.0f;
	config.depthImage[4 * (y * config.width + x) + 1] = 0.0f;
	config.depthImage[4 * (y * config.width + x) + 2] = 0.0f;
	config.depthImage[4 * (y * config.width + x) + 3] = 0.0f;
	config.texcoordImage[4 * (y * config.width + x) + 0] = 0.0f;
	config.texcoordImage[4 * (y * config.width + x) + 1] = 0.0f;
	config.texcoordImage[4 * (y * config.width + x) + 2] = 0.0f;
	config.texcoordImage[4 * (y * config.width + x) + 3] = 0.0f;
	config.varycoordImage[4 * (y * config.width + x) + 0] = 0.0f;
	config.varycoordImage[4 * (y * config.width + x) + 1] = 0.0f;
	config.varycoordImage[4 * (y * config.width + x) + 2] = 0.0f;
	config.varycoordImage[4 * (y * config.width + x) + 3] = 0.0f;
	}
	}
	}

	for (int x = 0; x < config.width; x++) {
	aux_rgba[4 * (y * config.width + x) + 0] = 0.0f;
	aux_rgba[4 * (y * config.width + x) + 1] = 0.0f;
	aux_rgba[4 * (y * config.width + x) + 2] = 0.0f;
	aux_rgba[4 * (y * config.width + x) + 3] = 0.0f;
	}
	}
	}));
	}

	for (auto& t : workers) {
	t.join();
	}

	return (!cancelFlag);
	};

	} // namespace example