32bpp_sse4.hpp

Go to the documentation of this file.
00001 /* $Id: 32bpp_sse4.hpp 26223 2014-01-03 18:43:10Z planetmaker $ */
00002 
00003 /*
00004  * This file is part of OpenTTD.
00005  * OpenTTD is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, version 2.
00006  * OpenTTD is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
00007  * See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with OpenTTD. If not, see <http://www.gnu.org/licenses/>.
00008  */
00009 
00012 #ifndef BLITTER_32BPP_SSE4_HPP
00013 #define BLITTER_32BPP_SSE4_HPP
00014 
00015 #ifdef WITH_SSE
00016 
00017 #include "32bpp_ssse3.hpp"
00018 #include "smmintrin.h"
00019 
00020 #undef EXTR32
00021 #define EXTR32(from, rank) _mm_extract_epi32((*(um128i*) &from).m128i, rank)
00022 #undef INSR32
00023 #define INSR32(val, into, rank) (*(um128i*) &into).m128i = _mm_insert_epi32((*(um128i*) &into).m128i, val, rank)
00024 
00025 IGNORE_UNINITIALIZED_WARNING_START
00026 #ifdef _SQ64
00027   #undef INSR64
00028   #define INSR64(val, into, rank) (*(um128i*) &into).m128i = _mm_insert_epi64((*(um128i*) &into).m128i, val, rank)
00029 #else
00030   typedef union { uint64 u64; struct _u32 { uint32 low, high; } u32; } u6432;
00031   #undef INSR64
00032   #define INSR64(val, into, rank) { \
00033     u6432 v; \
00034     v.u64 = val; \
00035     (*(um128i*) &into).m128i = _mm_insert_epi32((*(um128i*) &into).m128i, v.u32.low, (rank)*2); \
00036     (*(um128i*) &into).m128i = _mm_insert_epi32((*(um128i*) &into).m128i, v.u32.high, (rank)*2 + 1); \
00037   }
00038 #endif
00039 IGNORE_UNINITIALIZED_WARNING_STOP
00040 
00042 class Blitter_32bppSSE4 : public Blitter_32bppSSSE3 {
00043 public:
00044   Colour AdjustBrightness(Colour colour, uint8 brightness);
00045   static Colour ReallyAdjustBrightness(Colour colour, uint8 brightness);
00046 
00047   /* virtual */ void Draw(Blitter::BlitterParams *bp, BlitterMode mode, ZoomLevel zoom);
00048   template <BlitterMode mode, Blitter_32bppSSE_Base::ReadMode read_mode, Blitter_32bppSSE_Base::BlockType bt_last>
00049   void Draw(const Blitter::BlitterParams *bp, ZoomLevel zoom);
00050   /* virtual */ const char *GetName() { return "32bpp-sse4"; }
00051 };
00052 
00054 class FBlitter_32bppSSE4: public BlitterFactory {
00055 public:
00056   FBlitter_32bppSSE4() : BlitterFactory("32bpp-sse4", "32bpp SSE4 Blitter (no palette animation)", HasCPUIDFlag(1, 2, 19)) {}
00057   /* virtual */ Blitter *CreateInstance() { return new Blitter_32bppSSE4(); }
00058 };
00059 
00060 #endif /* WITH_SSE */
00061 #endif /* BLITTER_32BPP_SSE4_HPP */