pyrit: comparison include/vector.h

equal deleted inserted replaced

-:9d66d323c354
+:9af5c039b678
 /*
 * vector.h: Vector class with Colour alias
 *
 * This file is part of Pyrit Ray Tracer.
 *
-* Copyright 2006, 2007  Radek Brich
+* Copyright 2006, 2007, 2008  Radek Brich
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 #include <math.h>
 #include <iostream>
 #include "common.h"
+#include "simd.h"
 using namespace std;
 /**
 * three cell vector
 class Vector
 {
 public:
 	// data
 	union {
-#ifndef NO_SSE
+#ifndef NO_SIMD
-		__m128 mps;
+		mfloat4 mf4;
 #endif
 		Float cell[4];
 		struct { Float x, y, z, w; };
 		struct { Float r, g, b, a; };
 	};
 	// constructors
-#ifndef NO_SSE
+#ifndef NO_SIMD
-	Vector(__m128 m): mps(m) {};
+	Vector(mfloat4 m): mf4(m) {};
 #endif
 	Vector(): x(0.0f), y(0.0f), z(0.0f), w(1.0) {};
 	Vector(Float ax, Float ay, Float az): x(ax), y(ay), z(az), w(1.0) {};
 	// index operator
 	const Float &operator[](int index) const { return cell[index]; };
+	Float &operator[](int index) { return cell[index]; };
-	bool operator==(Vector &v) const { return x==v.x && y==v.y && z==v.z; };
+	bool operator==(const Vector &v) const { return x==v.x && y==v.y && z==v.z; };
 	// normalize
 	Vector normalize()
 	{
 		const Float f = 1.0f / mag();
 	Vector operator-() const { return Vector(-x, -y, -z); };
 	// accumulate
 	Vector operator+=(const Vector &v)
 	{
-#ifdef NO_SSE
+#ifdef NO_SIMD
 		x += v.x;
 		y += v.y;
 		z += v.z;
 #else
-		mps = _mm_add_ps(mps, v.mps);
+		mf4 = madd(mf4, v.mf4);
 #endif
 		return *this;
 	};
 	// multiply
 	// cut
 	Vector operator/=(const Float &f)
 	{
-		Float finv = 1./f;
+		Float finv = 1.0f / f;
 		x *= finv;
 		y *= finv;
 		z *= finv;
 		return *this;
 	};
 	// sum
 	friend Vector operator+(const Vector &a, const Vector &b)
 	{
-#ifdef NO_SSE
+#ifdef NO_SIMD
 		return Vector(a.x + b.x, a.y + b.y, a.z + b.z);
 #else
-		return Vector(_mm_add_ps(a.mps, b.mps));
+		return Vector(madd(a.mf4, b.mf4));
 #endif
 	};
 	// difference
 	friend Vector operator-(const Vector &a, const Vector &b)
 	{
-#ifdef NO_SSE
+#ifdef NO_SIMD
 		return Vector(a.x - b.x, a.y - b.y, a.z - b.z);
 #else
-		return Vector(_mm_sub_ps(a.mps, b.mps));
+		return Vector(msub(a.mf4, b.mf4));
 #endif
 	};
 	// dot product
 	friend Float dot(const Vector &a, const Vector &b)
 	};
 	// scalar division
 	friend Vector operator/(const Vector &v, const Float &f)
 	{
-		const Float finv = 1./f;
+		const Float finv = 1.0f / f;
 		return Vector(v.x * finv, v.y * finv, v.z * finv);
 	};
 	friend Vector operator/(const Float &f, const Vector &v)
 	{
-#ifdef NO_SSE
+#ifdef NO_SIMD
 		return Vector(f / v.x, f / v.y, f / v.z);
 #else
-		return Vector(_mm_div_ps(_mm_set_ps1(f), v.mps));
+		return Vector(mdiv(mset1(f), v.mf4));
 #endif
 	};
 	// vector plus scalar
 	friend Vector operator+(const Vector &v, const Float &f)
 	};
 	// cell by cell product (only usable for colours)
 	friend Vector operator*(const Vector &a,  const Vector &b)
 	{
-#ifdef NO_SSE
+#ifdef NO_SIMD
 		return Vector(a.x * b.x, a.y * b.y, a.z * b.z);
 #else
-		return Vector(_mm_mul_ps(a.mps, b.mps));
+		return Vector(mmul(a.mf4, b.mf4));
 #endif
 	};
 	// write
 	friend ostream & operator<<(ostream &st, const Vector &v)
 	};
 };
 typedef Vector Colour;
-#ifndef NO_SSE
+#ifndef NO_SIMD
 class VectorPacket
 {
 public:
 	union {
-		__m128 ma[3];
+		mfloat4 ma[3];
 		struct {
-			__m128 mx;
+			mfloat4 mx;
-			__m128 my;
+			mfloat4 my;
-			__m128 mz;
+			mfloat4 mz;
 		};
 		struct {
 			float x[4];
 			float y[4];
 			float z[4];
 		};
 	};
 	VectorPacket() {};
-	VectorPacket(__m128 ax, __m128 ay, __m128 az):
+	VectorPacket(mfloat4 ax, mfloat4 ay, mfloat4 az):
 		mx(ax), my(ay), mz(az) {};
 	VectorPacket(const Vector &v):
-		mx(_mm_set_ps1(v.x)), my(_mm_set_ps1(v.y)), mz(_mm_set_ps1(v.z)) {};
+		mx(mset1(v.x)), my(mset1(v.y)), mz(mset1(v.z)) {};
 	Vector getVector(int i) const
 	{
 		return Vector(x[i], y[i], z[i]);
 	};
 		x[i] = v.x; y[i] = v.y; z[i] = v.z;
 	};
 	void normalize()
 	{
-		__m128 m,x,y,z;
+		mfloat4 m,x,y,z;
-		x = _mm_mul_ps(mx, mx); // x*x
+		x = mmul(mx, mx); // x*x
-		y = _mm_mul_ps(my, my); // y*y
+		y = mmul(my, my); // y*y
-		z = _mm_mul_ps(mz, mz); // z*z
+		z = mmul(mz, mz); // z*z
-		m = _mm_add_ps(x, y);
+		m = madd(madd(x, y), z);     // x*x + y*y + z*z
-		m = _mm_add_ps(m, z);     // x*x + y*y + z*z
+		m = mdiv(mOne, msqrt(m));   // m = 1/sqrt(m)
-		m = _mm_sqrt_ps(m);
+		mx = mmul(mx, m);
-		m = _mm_div_ps(mOne, m);   // m = 1/sqrt(m)
+		my = mmul(my, m);
-		mx = _mm_mul_ps(mx, m);
+		mz = mmul(mz, m);
-		my = _mm_mul_ps(my, m);
-		mz = _mm_mul_ps(mz, m);
 	};
 	// accumulate
 	VectorPacket operator+=(const VectorPacket &v)
 	{
-		mx = _mm_add_ps(mx, v.mx);
+		mx = madd(mx, v.mx);
-		my = _mm_add_ps(my, v.my);
+		my = madd(my, v.my);
-		mz = _mm_add_ps(mz, v.mz);
+		mz = madd(mz, v.mz);
 		return *this;
 	};
 	// add to non-masked components
-	VectorPacket selectiveAdd(__m128 mask, const VectorPacket &v)
+	VectorPacket selectiveAdd(const mfloat4 &mask, const VectorPacket &v)
 	{
-		mx = _mm_or_ps(_mm_and_ps(mask, _mm_add_ps(mx, v.mx)),
+		mx = mselect(mask, madd(mx, v.mx), mx);
-			_mm_andnot_ps(mask, mx));
+		my = mselect(mask, madd(my, v.my), my);
-		my = _mm_or_ps(_mm_and_ps(mask, _mm_add_ps(my, v.my)),
+		mz = mselect(mask, madd(mz, v.mz), mz);
-			_mm_andnot_ps(mask, my));
-		mz = _mm_or_ps(_mm_and_ps(mask, _mm_add_ps(mz, v.mz)),
-			_mm_andnot_ps(mask, mz));
 		return *this;
 	};
 	// add scalar to non-masked components
-	VectorPacket selectiveAdd(__m128 mask, const __m128 m)
+	VectorPacket selectiveAdd(const mfloat4 &mask, const mfloat4 &m)
 	{
-		mx = _mm_or_ps(_mm_and_ps(mask, _mm_add_ps(mx, m)),
+		mx = mselect(mask, madd(mx, m), mx);
-			_mm_andnot_ps(mask, mx));
+		my = mselect(mask, madd(my, m), my);
-		my = _mm_or_ps(_mm_and_ps(mask, _mm_add_ps(my, m)),
+		mz = mselect(mask, madd(mz, m), mz);
-			_mm_andnot_ps(mask, my));
-		mz = _mm_or_ps(_mm_and_ps(mask, _mm_add_ps(mz, m)),
-			_mm_andnot_ps(mask, mz));
 		return *this;
 	};
 	// dot product
-	friend __m128 dot(const VectorPacket &a, const VectorPacket &b)
+	friend mfloat4 dot(const VectorPacket &a, const VectorPacket &b)
 	{
-		return _mm_add_ps(_mm_add_ps(
+		return madd(madd(
-			_mm_mul_ps(a.mx, b.mx),
+			mmul(a.mx, b.mx),
-			_mm_mul_ps(a.my, b.my)),
+			mmul(a.my, b.my)),
-			_mm_mul_ps(a.mz, b.mz));
+			mmul(a.mz, b.mz));
 	};
 	friend VectorPacket operator+(const VectorPacket &a, const VectorPacket &b)
 	{
 		return VectorPacket(
-			_mm_add_ps(a.mx, b.mx),
+			madd(a.mx, b.mx),
-			_mm_add_ps(a.my, b.my),
+			madd(a.my, b.my),
-			_mm_add_ps(a.mz, b.mz));
+			madd(a.mz, b.mz));
 	};
 	friend VectorPacket operator-(const VectorPacket &a, const VectorPacket &b)
 	{
 		return VectorPacket(
-			_mm_sub_ps(a.mx, b.mx),
+			msub(a.mx, b.mx),
-			_mm_sub_ps(a.my, b.my),
+			msub(a.my, b.my),
-			_mm_sub_ps(a.mz, b.mz));
+			msub(a.mz, b.mz));
 	};
-	friend VectorPacket operator*(const VectorPacket &v,  const __m128 &m)
+	friend VectorPacket operator*(const VectorPacket &v,  const mfloat4 &m)
 	{
 		return VectorPacket(
-			_mm_mul_ps(v.mx, m),
+			mmul(v.mx, m),
-			_mm_mul_ps(v.my, m),
+			mmul(v.my, m),
-			_mm_mul_ps(v.mz, m));
+			mmul(v.mz, m));
 	};
-	friend VectorPacket operator/(const __m128 &m, const VectorPacket &v)
+	friend VectorPacket operator/(const mfloat4 &m, const VectorPacket &v)
 	{
 		return VectorPacket(
-			_mm_div_ps(m, v.mx),
+			mdiv(m, v.mx),
-			_mm_div_ps(m, v.my),
+			mdiv(m, v.my),
-			_mm_div_ps(m, v.mz));
+			mdiv(m, v.mz));
 	};
 	// cell by cell product (only usable for colours)
 	friend VectorPacket operator*(const VectorPacket &a,  const VectorPacket &b)
 	{
 		return VectorPacket(
-			_mm_mul_ps(a.mx, b.mx),
+			mmul(a.mx, b.mx),
-			_mm_mul_ps(a.my, b.my),
+			mmul(a.my, b.my),
-			_mm_mul_ps(a.mz, b.mz));
+			mmul(a.mz, b.mz));
 	};
 	// write to character stream
 	friend ostream & operator<<(ostream &st, const VectorPacket &v)
 	{

branch	pyrit
changeset 92	9af5c039b678
parent 91	9d66d323c354
child 93	96d65f841791