clray

annotate src/rt.cc @ 16:9e4a28063394

cl compiler segfaults...
author John Tsiombikas <nuclear@member.fsf.org>
date Mon, 09 Aug 2010 04:18:21 +0100
parents 754faf15ba36
children 4b1604f9798a
rev   line source
nuclear@0 1 #include <stdio.h>
nuclear@8 2 #include <string.h>
nuclear@2 3 #include <math.h>
nuclear@0 4 #include <assert.h>
John@14 5 #include "ogl.h"
nuclear@0 6 #include "ocl.h"
nuclear@9 7 #include "mesh.h"
nuclear@0 8
/* Indices of the kernel arguments, in the order in which init_renderer()
 * registers their buffers. NUM_KERNEL_ARGS is the number of arguments.
 */
enum {
	KARG_FRAMEBUFFER    = 0,	/* output image, 4 floats per pixel */
	KARG_RENDER_INFO    = 1,	/* the RendInfo structure */
	KARG_FACES          = 2,	/* flat array of scene faces */
	KARG_MATLIB         = 3,	/* scene materials */
	KARG_LIGHTS         = 4,	/* light list */
	KARG_PRIM_RAYS      = 5,	/* one primary ray per pixel */
	KARG_XFORM          = 6,	/* 16-float matrix, see set_xform() */
	KARG_INVTRANS_XFORM = 7,	/* 16-float matrix, see set_xform() */
	KARG_OUTFACES       = 8,	/* DBG: faces written back by the kernel */

	NUM_KERNEL_ARGS     = 9
};
John@11 23
/* Global rendering parameters. init_renderer() fills one instance and passes
 * it to the kernel as the KARG_RENDER_INFO buffer, so the field order and
 * types must stay exactly as they are.
 */
struct RendInfo {
	int xsz;		/* image width in pixels */
	int ysz;		/* image height in pixels */
	int num_faces;		/* number of faces in the face buffer */
	int num_lights;		/* number of entries in the light list */
	int max_iter;		/* iteration limit (presumably ray bounces - confirm in rt.cl) */
	float ambient[4];	/* ambient term, 4 components */
	int dbg;		/* debug value, can be changed with dbg_set_dbg() */
};
nuclear@2 31
/* A ray as stored in the primary ray buffer (KARG_PRIM_RAYS).
 * The field order and types must stay exactly as they are.
 */
struct Ray {
	float origin[4];	/* ray origin, 4 components */
	float dir[4];		/* ray direction, 4 components */
	float energy;		/* primary rays start out with 1.0 */
};
nuclear@1 36
/* A light source as stored in the light buffer (KARG_LIGHTS).
 * The field order and types must stay exactly as they are.
 */
struct Light {
	float pos[4];		/* position, 4 components */
	float color[4];		/* color, 4 components */
};
nuclear@1 40
nuclear@3 41 static Ray get_primary_ray(int x, int y, int w, int h, float vfov_deg);
nuclear@13 42 static Face *create_face_buffer(Mesh **meshes, int num_meshes);
nuclear@3 43
nuclear@13 44 static Face *faces;
nuclear@3 45 static Ray *prim_rays;
nuclear@3 46 static CLProgram *prog;
nuclear@3 47 static int global_size;
nuclear@3 48
nuclear@4 49 static Light lightlist[] = {
nuclear@16 50 {{-10, 13, -20, 0}, {1, 1, 1, 1}}
nuclear@4 51 };
nuclear@4 52
nuclear@7 53
nuclear@4 54 static RendInfo rinf;
nuclear@4 55
nuclear@4 56
nuclear@13 57 bool init_renderer(int xsz, int ysz, Scene *scn)
nuclear@0 58 {
nuclear@4 59 // render info
nuclear@16 60 rinf.ambient[0] = rinf.ambient[1] = rinf.ambient[2] = 0.075;
nuclear@16 61 rinf.ambient[3] = 0.0;
nuclear@16 62
nuclear@4 63 rinf.xsz = xsz;
nuclear@4 64 rinf.ysz = ysz;
nuclear@13 65 rinf.num_faces = scn->get_num_faces();
nuclear@4 66 rinf.num_lights = sizeof lightlist / sizeof *lightlist;
nuclear@4 67 rinf.max_iter = 6;
John@15 68 rinf.dbg = 8;
nuclear@4 69
nuclear@3 70 /* calculate primary rays */
nuclear@3 71 prim_rays = new Ray[xsz * ysz];
nuclear@2 72
nuclear@2 73 for(int i=0; i<ysz; i++) {
nuclear@2 74 for(int j=0; j<xsz; j++) {
nuclear@2 75 prim_rays[i * xsz + j] = get_primary_ray(j, i, xsz, ysz, 45.0);
nuclear@2 76 }
nuclear@0 77 }
nuclear@0 78
nuclear@2 79 /* setup opencl */
nuclear@3 80 prog = new CLProgram("render");
nuclear@3 81 if(!prog->load("rt.cl")) {
nuclear@8 82 return false;
nuclear@0 83 }
nuclear@0 84
nuclear@13 85 /*Face **/faces = create_face_buffer(&scn->meshes[0], scn->meshes.size());
nuclear@13 86 if(!faces) {
nuclear@13 87 fprintf(stderr, "failed to create face buffer\n");
nuclear@13 88 return false;
nuclear@13 89 }
nuclear@13 90
nuclear@3 91 /* setup argument buffers */
nuclear@12 92 prog->set_arg_buffer(KARG_FRAMEBUFFER, ARG_WR, xsz * ysz * 4 * sizeof(float));
nuclear@12 93 prog->set_arg_buffer(KARG_RENDER_INFO, ARG_RD, sizeof rinf, &rinf);
John@14 94 prog->set_arg_buffer(KARG_FACES, ARG_RD, rinf.num_faces * sizeof(Face), faces);
John@14 95 prog->set_arg_buffer(KARG_MATLIB, ARG_RD, scn->get_num_materials() * sizeof(Material), scn->get_materials());
nuclear@12 96 prog->set_arg_buffer(KARG_LIGHTS, ARG_RD, sizeof lightlist, lightlist);
nuclear@12 97 prog->set_arg_buffer(KARG_PRIM_RAYS, ARG_RD, xsz * ysz * sizeof *prim_rays, prim_rays);
nuclear@12 98 prog->set_arg_buffer(KARG_XFORM, ARG_RD, 16 * sizeof(float));
nuclear@12 99 prog->set_arg_buffer(KARG_INVTRANS_XFORM, ARG_RD, 16 * sizeof(float));
John@15 100 prog->set_arg_buffer(KARG_OUTFACES, ARG_WR, rinf.num_faces * sizeof(Face));
nuclear@12 101
John@14 102 if(prog->get_num_args() < NUM_KERNEL_ARGS) {
John@14 103 return false;
John@14 104 }
John@14 105
nuclear@16 106 if(!prog->build()) {
nuclear@16 107 return false;
nuclear@16 108 }
nuclear@16 109
nuclear@12 110 delete [] prim_rays;
nuclear@2 111
nuclear@3 112 global_size = xsz * ysz;
nuclear@3 113 return true;
nuclear@3 114 }
nuclear@3 115
nuclear@3 116 void destroy_renderer()
nuclear@3 117 {
nuclear@3 118 delete prog;
nuclear@3 119 }
nuclear@3 120
nuclear@3 121 bool render()
nuclear@3 122 {
nuclear@13 123 printf("Running kernel...");
nuclear@13 124 fflush(stdout);
nuclear@3 125 if(!prog->run(1, global_size)) {
nuclear@3 126 return false;
nuclear@0 127 }
nuclear@13 128 printf("done\n");
nuclear@0 129
John@15 130 /* DEBUG */
John@15 131 CLMemBuffer *dbgbuf = prog->get_arg_buffer(KARG_OUTFACES);
John@15 132 Face *outfaces = (Face*)map_mem_buffer(dbgbuf, MAP_RD);
John@15 133 for(int i=0; i<rinf.num_faces; i++) {
John@15 134 if(!(faces[i] == outfaces[i])) {
John@15 135 fprintf(stderr, "SKATA %d\n", i);
John@15 136 return false;
John@15 137 }
John@15 138 faces[i] = outfaces[i];
John@15 139 }
John@15 140 printf("equality test passed\n");
John@15 141 unmap_mem_buffer(dbgbuf);
John@15 142
John@15 143
nuclear@13 144 CLMemBuffer *mbuf = prog->get_arg_buffer(KARG_FRAMEBUFFER);
nuclear@12 145 void *fb = map_mem_buffer(mbuf, MAP_RD);
nuclear@13 146 if(!fb) {
nuclear@13 147 fprintf(stderr, "FAILED\n");
nuclear@13 148 return false;
nuclear@13 149 }
nuclear@13 150
nuclear@12 151 glTexSubImage2D(GL_TEXTURE_2D, 0, 0, 0, rinf.xsz, rinf.ysz, GL_RGBA, GL_FLOAT, fb);
nuclear@2 152 unmap_mem_buffer(mbuf);
nuclear@3 153 return true;
nuclear@0 154 }
nuclear@2 155
John@15 156 void dbg_set_dbg(int dbg)
John@15 157 {
John@15 158 printf("setting dbg: %d\n", dbg);
John@15 159
John@15 160 CLMemBuffer *mbuf = prog->get_arg_buffer(KARG_RENDER_INFO);
John@15 161 RendInfo *rinf = (RendInfo*)map_mem_buffer(mbuf, MAP_WR);
John@15 162 rinf->dbg = dbg;
John@15 163 unmap_mem_buffer(mbuf);
John@15 164 }
John@15 165
nuclear@13 166 void dbg_render_gl(Scene *scn)
nuclear@8 167 {
John@15 168 float lpos[] = {-1, 1, 10, 0};
nuclear@12 169 glPushAttrib(GL_ENABLE_BIT | GL_TRANSFORM_BIT);
nuclear@8 170
nuclear@12 171 glDisable(GL_TEXTURE_2D);
nuclear@12 172 glEnable(GL_DEPTH_TEST);
John@15 173 glEnable(GL_LIGHTING);
John@15 174 glEnable(GL_LIGHT0);
John@15 175 glLightfv(GL_LIGHT0, GL_POSITION, lpos);
John@15 176 glEnable(GL_COLOR_MATERIAL);
nuclear@12 177
nuclear@12 178 glMatrixMode(GL_PROJECTION);
nuclear@12 179 glPushMatrix();
nuclear@12 180 glLoadIdentity();
nuclear@12 181 gluPerspective(45.0, (float)rinf.xsz / (float)rinf.ysz, 0.5, 1000.0);
nuclear@12 182
John@14 183 Material *materials = scn->get_materials();
John@14 184
nuclear@12 185 glBegin(GL_TRIANGLES);
nuclear@13 186 int num_faces = scn->get_num_faces();
nuclear@13 187 for(int i=0; i<num_faces; i++) {
John@14 188 Material *mat = materials ? materials + faces[i].matid : 0;
John@14 189
John@14 190 if(mat) {
John@14 191 glColor3f(mat->kd[0], mat->kd[1], mat->kd[2]);
John@14 192 } else {
John@14 193 glColor3f(1, 1, 1);
John@14 194 }
nuclear@12 195
nuclear@12 196 for(int j=0; j<3; j++) {
nuclear@12 197 float *pos = faces[i].v[j].pos;
John@15 198 float *norm = faces[i].normal;
John@15 199 glNormal3fv(norm);
John@15 200 glVertex3fv(pos);
nuclear@12 201 }
nuclear@12 202 }
nuclear@13 203
nuclear@13 204 /*for(size_t i=0; i<scn->meshes.size(); i++) {
nuclear@13 205 Material *mat = &scn->matlib[scn->meshes[i]->matid];
nuclear@13 206
nuclear@13 207 glColor3f(mat->kd[0], mat->kd[1], mat->kd[2]);
nuclear@13 208 for(size_t j=0; j<scn->meshes[i]->faces.size(); j++) {
nuclear@13 209 for(int k=0; k<3; k++) {
nuclear@13 210 float *pos = scn->meshes[i]->faces[j].v[k].pos;
nuclear@13 211 glVertex3f(pos[0], pos[1], pos[2]);
nuclear@13 212 }
nuclear@13 213 }
nuclear@13 214 }*/
nuclear@12 215 glEnd();
nuclear@12 216
nuclear@12 217 glPopMatrix();
nuclear@12 218 glPopAttrib();
nuclear@12 219 }
nuclear@12 220
nuclear@12 221 void set_xform(float *matrix, float *invtrans)
nuclear@12 222 {
nuclear@12 223 CLMemBuffer *mbuf_xform = prog->get_arg_buffer(KARG_XFORM);
nuclear@12 224 CLMemBuffer *mbuf_invtrans = prog->get_arg_buffer(KARG_INVTRANS_XFORM);
nuclear@12 225 assert(mbuf_xform && mbuf_invtrans);
nuclear@12 226
nuclear@12 227 float *mem = (float*)map_mem_buffer(mbuf_xform, MAP_WR);
nuclear@12 228 memcpy(mem, matrix, 16 * sizeof *mem);
nuclear@13 229 /*printf("-- xform:\n");
nuclear@12 230 for(int i=0; i<16; i++) {
nuclear@12 231 printf("%2.3f\t", mem[i]);
nuclear@12 232 if(i % 4 == 3) putchar('\n');
nuclear@13 233 }*/
nuclear@12 234 unmap_mem_buffer(mbuf_xform);
nuclear@12 235
nuclear@12 236 mem = (float*)map_mem_buffer(mbuf_invtrans, MAP_WR);
nuclear@12 237 memcpy(mem, invtrans, 16 * sizeof *mem);
nuclear@13 238 /*printf("-- inverse-transpose:\n");
nuclear@12 239 for(int i=0; i<16; i++) {
nuclear@12 240 printf("%2.3f\t", mem[i]);
nuclear@12 241 if(i % 4 == 3) putchar('\n');
nuclear@13 242 }*/
nuclear@12 243 unmap_mem_buffer(mbuf_invtrans);
nuclear@8 244 }
nuclear@8 245
nuclear@3 246 static Ray get_primary_ray(int x, int y, int w, int h, float vfov_deg)
nuclear@2 247 {
nuclear@2 248 float vfov = M_PI * vfov_deg / 180.0;
nuclear@2 249 float aspect = (float)w / (float)h;
nuclear@2 250
nuclear@2 251 float ysz = 2.0;
nuclear@2 252 float xsz = aspect * ysz;
nuclear@2 253
nuclear@2 254 float px = ((float)x / (float)w) * xsz - xsz / 2.0;
nuclear@2 255 float py = 1.0 - ((float)y / (float)h) * ysz;
nuclear@2 256 float pz = 1.0 / tan(0.5 * vfov);
nuclear@2 257
nuclear@4 258 px *= 100.0;
nuclear@4 259 py *= 100.0;
nuclear@4 260 pz *= 100.0;
nuclear@2 261
nuclear@16 262 Ray ray = {{0, 0, 0, 1}, {px, py, -pz, 1}, 1.0};
nuclear@2 263 return ray;
nuclear@2 264 }
nuclear@13 265
nuclear@13 266 static Face *create_face_buffer(Mesh **meshes, int num_meshes)
nuclear@13 267 {
nuclear@13 268 int num_faces = 0;
nuclear@13 269 for(int i=0; i<num_meshes; i++) {
nuclear@13 270 num_faces += meshes[i]->faces.size();
nuclear@13 271 }
nuclear@13 272 printf("constructing face buffer with %d faces (out of %d meshes)\n", num_faces, num_meshes);
nuclear@13 273
nuclear@13 274 Face *faces = new Face[num_faces];
nuclear@13 275 memset(faces, 0, num_faces * sizeof *faces);
nuclear@13 276 Face *fptr = faces;
nuclear@13 277
nuclear@13 278 for(int i=0; i<num_meshes; i++) {
nuclear@13 279 for(size_t j=0; j<meshes[i]->faces.size(); j++) {
nuclear@13 280 *fptr++ = meshes[i]->faces[j];
nuclear@13 281 }
nuclear@13 282 }
nuclear@13 283 return faces;
nuclear@13 284 }