Members/kono/Cerium: Renderer/Engine/spe/DrawSpan.cc comparison

comparison Renderer/Engine/spe/DrawSpan.cc @ 775:97a514cf6ad3 before-simple-task

simd

author	yutaka@henri.cr.ie.u-ryukyu.ac.jp
date	Tue, 16 Feb 2010 15:09:54 +0900
parents	dc26593f8c40
children	4455e7b0caf3

comparison

Legend: equal (leading space), deleted (leading -), inserted (leading +), replaced

-:5102e1751d6f
+:97a514cf6ad3
 static    int infinity_light_calc(int color,float normal_x, float normal_y, float normal_z,
 SchedTask *smanager,int x, int y, float z, int world_x, int world_y, float world_z);
-void
-normalize(vector float *v0, vector float *v1)
+static inline void
-{
+normalize(vector float& v0, vector float& v1)
-float norm;
+{
-float ret[4] __attribute__((aligned(16)));
+float norm;
-vector float *vret = (vector float *) ret;
+vector float ret __attribute__((aligned(16))) = {0,0,0,0};
-*vret = spu_mul(*v0,*v1);
+ret = spu_mul(v0,v1);
 norm = (ret[0] + ret[1] + ret[2]);
-*vret = (vector float)spu_splats(norm);
+ret = (vector float)spu_splats(norm);
-*vret = spu_rsqrte(*vret);
+ret = spu_rsqrte(ret);
-*v0 = spu_mul(*v1,*vret);
+v0 = spu_mul(v1,ret);
 }
-static float
+static inline float
-innerProduct1(vector float *v0, vector float *v1)
+innerProduct1(vector float& v0, vector float& v1)
 {
-float ret[4] __attribute__((aligned(16)));
+vector float ret __attribute__((aligned(16))) = {0,0,0,0};
 float inner;
-vector float *vret = (vector float *) ret;
+ret = spu_mul(v0,v1);
-*vret = spu_mul(*v0,*v1);
+inner = (ret[0] + ret[1] + ret[2]);
-inner = (ret[0] + ret[1] + ret[2]);
+if (inner < 0) {
-if (inner < 0) {
+inner = 0;
-inner = 0;
+}
-}
+return inner;
-return inner;
+}
-}
 /**
 * テクスチャは、TEXTURE_SPLIT_PIXEL^2 のブロックに分割する
 rgb[1] = (color & 0x0000ff00) >> 8;
 rgb[0] = (color & 0x000000ff);
 #endif
+vector float *light_xyz = (vector float*)smanager->global_get(Light);
 vector float v_rgb __attribute__((aligned(16))) = {(float)rgb[0],(float)rgb[1],(float)rgb[2],0};
-int light_rgb;
+vector float normal_vector __attribute__((aligned(16))) = {normal_x,normal_y,normal_z,0};
-float normal_vector[4] __attribute__((aligned(16))) = {normal_x,normal_y,normal_z,0};
+vector float light_vector __attribute__((aligned(16))) = {0,0,0,0};
-vector float *vnormal_vector = (vector float *) normal_vector;
-float light_vector[4];
-vector float *vlight_vector = (vector float *) light_vector;
-float inner_product;
-float *light_xyz = (float*)smanager->global_get(Light);
-vector float *vlight_xyz = (vector float *) light_xyz;
 vector float v_inner __attribute__((aligned(16)));
 vector float v_world[4] __attribute__((aligned(16))) = {{world_x, world_y, -world_z, 0},
 {world_x, world_y, -world_z, 0},
 {world_x, world_y, -world_z, 0},
 {0,       0,        0,       0}};
-normalize(vnormal_vector, vnormal_vector);
+int light_rgb;
+float inner_product;
-float tmp_rgb[4] __attribute__((aligned(16))) = {0,0,0,0};
+normalize(normal_vector, normal_vector);
-vector float *vtmp_rgb = (vector float *) tmp_rgb;
+vector float vtmp_rgb __attribute__((aligned(16))) = {0,0,0,0};
 int light_num = 4;
 for (int i = 0; i < light_num; i++) {
-*vlight_vector = spu_sub(v_world[i],vlight_xyz[i]);
+light_vector = spu_sub(v_world[i],light_xyz[i]);
-normalize(vlight_vector, vlight_vector);
+normalize(light_vector, light_vector);
-inner_product = innerProduct1(vnormal_vector,vlight_vector);
+inner_product = innerProduct1(normal_vector,light_vector);
 v_inner = spu_splats(inner_product);
-*vtmp_rgb = spu_madd(v_rgb,v_inner,*vtmp_rgb);
+vtmp_rgb = spu_madd(v_rgb,v_inner,vtmp_rgb);
 }
 vector unsigned int v_flag __attribute__((aligned(16)));
-vector float max_rgb __attribute__((aligned(16))) = (vector float)spu_splats((float)255);
+vector float max_rgb __attribute__((aligned(16))) = (vector float)spu_splats((float)255.0f);
-v_flag = spu_cmpgt(max_rgb,*vtmp_rgb);
+v_flag = spu_cmpgt(max_rgb,vtmp_rgb);
-*vtmp_rgb = spu_sel(max_rgb,*vtmp_rgb,v_flag);
+vtmp_rgb = spu_sel(max_rgb,vtmp_rgb,v_flag);
-vector unsigned int vlast_rgb __attribute__((aligned(16)));
+vector unsigned int last_rgb __attribute__((aligned(16)));
-vlast_rgb = spu_convtu(*vtmp_rgb,0);
+last_rgb = spu_convtu(vtmp_rgb,0);
-unsigned int *last_rgb = (unsigned int*) &vlast_rgb;
 //計算した rgb を light_rgb にまとめる。
 #if LITTLEENDIAN
 light_rgb = (last_rgb[0] << 24) + (last_rgb[1] << 16) + (last_rgb[2] << 8) + (last_rgb[3]);

Mercurial > hg > Members > kono > Cerium

comparison Renderer/Engine/spe/DrawSpan.cc @ 775:97a514cf6ad3 before-simple-task