123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883 |
- /*
- LICENSE
- -------
- Copyright 2005 Nullsoft, Inc.
- All rights reserved.
- Redistribution and use in source and binary forms, with or without modification,
- are permitted provided that the following conditions are met:
- * Redistributions of source code must retain the above copyright notice,
- this list of conditions and the following disclaimer.
- * Redistributions in binary form must reproduce the above copyright notice,
- this list of conditions and the following disclaimer in the documentation
- and/or other materials provided with the distribution.
- * Neither the name of Nullsoft nor the names of its contributors may be used to
- endorse or promote products derived from this software without specific prior written permission.
-
- THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR
- IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
- FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
- CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
- DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER
- IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
- OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- */
- // alphachannel safe 11/21/99
- #include <windows.h>
- #include <commctrl.h>
- #include "r_defs.h"
- #include "resource.h"
- #include "timing.h"
- #include "../Agave/Language/api_language.h"
- #ifndef LASER
- #define C_THISCLASS C_BlurClass
- #define MOD_NAME "Trans / Blur"
- static const int zero=0;
- class C_THISCLASS : public C_RBASE2 {
- protected:
- public:
- C_THISCLASS();
- virtual ~C_THISCLASS();
- virtual int render(char visdata[2][2][576], int isBeat, int *framebuffer, int *fbout, int w, int h);
- virtual char *get_desc() { static char desc[128]; return (!desc[0]?WASABI_API_LNGSTRING_BUF(IDS_TRANS_BLUR,desc,128):desc); }
- virtual HWND conf(HINSTANCE hInstance, HWND hwndParent);
- virtual void load_config(unsigned char *data, int len);
- virtual int save_config(unsigned char *data);
- virtual int smp_getflags() { return 1; }
- virtual int smp_begin(int max_threads, char visdata[2][2][576], int isBeat, int *framebuffer, int *fbout, int w, int h);
- virtual void smp_render(int this_thread, int max_threads, char visdata[2][2][576], int isBeat, int *framebuffer, int *fbout, int w, int h);
- virtual int smp_finish(char visdata[2][2][576], int isBeat, int *framebuffer, int *fbout, int w, int h); // return value is that of render() for fbstuff etc
- int enabled;
- int roundmode;
- };
- #define PUT_INT(y) data[pos]=(y)&255; data[pos+1]=(y>>8)&255; data[pos+2]=(y>>16)&255; data[pos+3]=(y>>24)&255
- #define GET_INT() (data[pos]|(data[pos+1]<<8)|(data[pos+2]<<16)|(data[pos+3]<<24))
- void C_THISCLASS::load_config(unsigned char *data, int len)
- {
- int pos=0;
- if (len-pos >= 4) { enabled=GET_INT(); pos+=4; }
- if (len-pos >= 4) { roundmode=GET_INT(); pos+=4; }
- else roundmode=0;
- }
- int C_THISCLASS::save_config(unsigned char *data)
- {
- int pos=0;
- PUT_INT(enabled); pos+=4;
- PUT_INT(roundmode); pos+=4;
- return pos;
- }
- C_THISCLASS::C_THISCLASS()
- {
- roundmode=0;
- enabled=1;
- }
- C_THISCLASS::~C_THISCLASS()
- {
- }
- #define MASK_SH1 (~(((1<<7)|(1<<15)|(1<<23))<<1))
- #define MASK_SH2 (~(((3<<6)|(3<<14)|(3<<22))<<2))
- #define MASK_SH3 (~(((7<<5)|(7<<13)|(7<<21))<<3))
- #define MASK_SH4 (~(((15<<4)|(15<<12)|(15<<20))<<4))
- static unsigned int mmx_mask1[2]={MASK_SH1,MASK_SH1};
- static unsigned int mmx_mask2[2]={MASK_SH2,MASK_SH2};
- static unsigned int mmx_mask3[2]={MASK_SH3,MASK_SH3};
- static unsigned int mmx_mask4[2]={MASK_SH4,MASK_SH4};
- #define DIV_2(x) ((( x ) & MASK_SH1)>>1)
- #define DIV_4(x) ((( x ) & MASK_SH2)>>2)
- #define DIV_8(x) ((( x ) & MASK_SH3)>>3)
- #define DIV_16(x) ((( x ) & MASK_SH4)>>4)
- void C_THISCLASS::smp_render(int this_thread, int max_threads, char visdata[2][2][576], int isBeat, int *framebuffer, int *fbout, int w, int h)
- {
- if (!enabled) return;
- timingEnter(0);
- unsigned int *f = (unsigned int *) framebuffer;
- unsigned int *of = (unsigned int *) fbout;
- if (max_threads < 1) max_threads=1;
- int start_l = ( this_thread * h ) / max_threads;
- int end_l;
- if (this_thread >= max_threads - 1) end_l = h;
- else end_l = ( (this_thread+1) * h ) / max_threads;
- int outh=end_l-start_l;
- if (outh<1) return;
- int skip_pix=start_l*w;
- f += skip_pix;
- of+= skip_pix;
- int at_top=0, at_bottom=0;
- if (!this_thread) at_top=1;
- if (this_thread >= max_threads - 1) at_bottom=1;
- if (enabled == 2)
- {
- // top line
- if (at_top)
- {
- unsigned int *f2=f+w;
- int x;
- int adj_tl=0, adj_tl2=0;
- if (roundmode) { adj_tl = 0x03030303; adj_tl2 = 0x04040404; }
- // top left
- *of++=DIV_2(f[0])+DIV_4(f[0])+DIV_8(f[1])+DIV_8(f2[0]) + adj_tl; f++; f2++;
- // top center
- x=(w-2)/4;
- while (x--)
- {
- of[0]=DIV_2(f[0]) + DIV_8(f[0]) + DIV_8(f[1]) + DIV_8(f[-1]) + DIV_8(f2[0]) + adj_tl2;
- of[1]=DIV_2(f[1]) + DIV_8(f[1]) + DIV_8(f[2]) + DIV_8(f[0]) + DIV_8(f2[1]) + adj_tl2;
- of[2]=DIV_2(f[2]) + DIV_8(f[2]) + DIV_8(f[3]) + DIV_8(f[1]) + DIV_8(f2[2]) + adj_tl2;
- of[3]=DIV_2(f[3]) + DIV_8(f[3]) + DIV_8(f[4]) + DIV_8(f[2]) + DIV_8(f2[3]) + adj_tl2;
- f+=4;
- f2+=4;
- of+=4;
- }
- x=(w-2)&3;
- while (x--)
- {
- *of++=DIV_2(f[0]) + DIV_8(f[0]) + DIV_8(f[1]) + DIV_8(f[-1]) + DIV_8(f2[0]) + adj_tl2;
- f++;
- f2++;
- }
- // top right
- *of++=DIV_2(f[0])+DIV_4(f[0]) + DIV_8(f[-1])+DIV_8(f2[0]) + adj_tl; f++; f2++;
- }
- // middle block
- {
- int y=outh-at_top-at_bottom;
- unsigned int adj_tl1=0,adj_tl2=0;
- unsigned __int64 adj2=0;
- if (roundmode) { adj_tl1=0x04040404; adj_tl2=0x05050505; adj2=0x0505050505050505i64; }
- while (y--)
- {
- int x;
- unsigned int *f2=f+w;
- unsigned int *f3=f-w;
-
- // left edge
- *of++=DIV_2(f[0])+DIV_8(f[0])+DIV_8(f[1])+DIV_8(f2[0])+DIV_8(f3[0])+adj_tl1; f++; f2++; f3++;
- // middle of line
- #ifdef NO_MMX
- x=(w-2)/4;
- if (roundmode)
- {
- while (x--)
- {
- of[0]=DIV_2(f[0]) + DIV_4(f[0]) + DIV_16(f[1]) + DIV_16(f[-1]) + DIV_16(f2[0]) + DIV_16(f3[0]) + 0x05050505;
- of[1]=DIV_2(f[1]) + DIV_4(f[1]) + DIV_16(f[2]) + DIV_16(f[0]) + DIV_16(f2[1]) + DIV_16(f3[1]) + 0x05050505;
- of[2]=DIV_2(f[2]) + DIV_4(f[2]) + DIV_16(f[3]) + DIV_16(f[1]) + DIV_16(f2[2]) + DIV_16(f3[2]) + 0x05050505;
- of[3]=DIV_2(f[3]) + DIV_4(f[3]) + DIV_16(f[4]) + DIV_16(f[2]) + DIV_16(f2[3]) + DIV_16(f3[3]) + 0x05050505;
- f+=4;
- f2+=4;
- f3+=4;
- of+=4;
- }
- }
- else
- {
- while (x--)
- {
- of[0]=DIV_2(f[0]) + DIV_4(f[0]) + DIV_16(f[1]) + DIV_16(f[-1]) + DIV_16(f2[0]) + DIV_16(f3[0]);
- of[1]=DIV_2(f[1]) + DIV_4(f[1]) + DIV_16(f[2]) + DIV_16(f[0]) + DIV_16(f2[1]) + DIV_16(f3[1]);
- of[2]=DIV_2(f[2]) + DIV_4(f[2]) + DIV_16(f[3]) + DIV_16(f[1]) + DIV_16(f2[2]) + DIV_16(f3[2]);
- of[3]=DIV_2(f[3]) + DIV_4(f[3]) + DIV_16(f[4]) + DIV_16(f[2]) + DIV_16(f2[3]) + DIV_16(f3[3]);
- f+=4;
- f2+=4;
- f3+=4;
- of+=4;
- }
- }
- #else
- {
- __asm
- {
- mov ecx, w
- mov edx, ecx
- mov ebx, edx
- neg ebx
- mov esi, f
- mov edi, of
- sub ecx, 2
- shr ecx, 2
- movq mm1, [esi-4]
- align 16
- mmx_light_blur_loop:
- movq mm0, [esi]
- movq mm2, [esi+4]
- pand mm0, mmx_mask1
- movq mm5, mm2
- psrl mm0, 1
- movq mm7, [esi+8]
- movq mm4, mm0
- pand mm1, mmx_mask4
- pand mm4, mmx_mask1
- movq mm3, [esi+edx*4]
- psrl mm4, 1
-
- paddb mm0, mm4
- pand mm2, mmx_mask4
- movq mm4, [esi+ebx*4]
- pand mm3, mmx_mask4
- pand mm4, mmx_mask4
- psrl mm1, 4
- pand mm7, mmx_mask1
- movq mm6, [esi+12]
- psrl mm2, 4
- add esi, 16
- psrl mm3, 4
- paddb mm0, mm1
- psrl mm4, 4
- movq mm1, mm6
- psrl mm7, 1
- paddb mm2, mm3
- paddb mm0, mm4
- movq mm3, [esi+edx*4-8]
- paddb mm0, mm2
- movq mm4, [esi+ebx*4-8]
- paddb mm0, [adj2]
- pand mm6, mmx_mask4
- movq [edi],mm0
- pand mm5, mmx_mask4
- movq mm0, mm7
- pand mm3, mmx_mask4
- psrl mm6, 4
- pand mm0, mmx_mask1
- pand mm4, mmx_mask4
- psrl mm5, 4
- psrl mm0, 1
- paddb mm7, mm6
- paddb mm7, mm0
- add edi, 16
- psrl mm3, 4
- psrl mm4, 4
- paddb mm5, mm3
- paddb mm7, mm4
- dec ecx
- paddb mm7, mm5
- paddb mm7, [adj2]
- movq [edi-8],mm7
-
- jnz mmx_light_blur_loop
- mov of, edi
- mov f, esi
- };
- f2=f+w; // update these bitches
- f3=f-w;
- }
- #endif
- x=(w-2)&3;
- while (x--)
- {
- *of++=DIV_2(f[0]) + DIV_4(f[0]) + DIV_16(f[1]) + DIV_16(f[-1]) + DIV_16(f2[0]) + DIV_16(f3[0]) + adj_tl2;
- f++;
- f2++;
- f3++;
- }
- // right block
- *of++=DIV_2(f[0])+DIV_8(f[0])+DIV_8(f[-1])+DIV_8(f2[0])+DIV_8(f3[0])+adj_tl1; f++;
- }
- }
- // bottom block
- if (at_bottom)
- {
- unsigned int *f2=f-w;
- int x;
- int adj_tl=0, adj_tl2=0;
- if (roundmode) { adj_tl = 0x03030303; adj_tl2 = 0x04040404; }
- // bottom left
- *of++=DIV_2(f[0])+DIV_4(f[0])+DIV_8(f[1])+DIV_8(f2[0]) + adj_tl; f++; f2++;
- // bottom center
- x=(w-2)/4;
- while (x--)
- {
- of[0]=DIV_2(f[0]) + DIV_8(f[0]) + DIV_8(f[1]) + DIV_8(f[-1]) + DIV_8(f2[0]) + adj_tl2;
- of[1]=DIV_2(f[1]) + DIV_8(f[1]) + DIV_8(f[2]) + DIV_8(f[0]) + DIV_8(f2[1]) + adj_tl2;
- of[2]=DIV_2(f[2]) + DIV_8(f[2]) + DIV_8(f[3]) + DIV_8(f[1]) + DIV_8(f2[2])+adj_tl2;
- of[3]=DIV_2(f[3]) + DIV_8(f[3]) + DIV_8(f[4]) + DIV_8(f[2]) + DIV_8(f2[3])+adj_tl2;
- f+=4;
- f2+=4;
- of+=4;
- }
- x=(w-2)&3;
- while (x--)
- {
- *of++=DIV_2(f[0]) + DIV_8(f[0]) + DIV_8(f[1]) + DIV_8(f[-1]) + DIV_8(f2[0])+adj_tl2;
- f++;
- f2++;
- }
- // bottom right
- *of++=DIV_2(f[0])+DIV_4(f[0]) + DIV_8(f[-1])+DIV_8(f2[0])+adj_tl; f++; f2++;
- }
- }
- else if (enabled == 3) // more blur
- {
- // top line
- if (at_top) {
- unsigned int *f2=f+w;
- int x;
- int adj_tl=0, adj_tl2=0;
- if (roundmode) { adj_tl = 0x02020202; adj_tl2 = 0x01010101; }
- // top left
- *of++=DIV_2(f[1])+DIV_2(f2[0]) + adj_tl2; f++; f2++;
- // top center
- x=(w-2)/4;
- while (x--)
- {
- of[0]=DIV_4(f[1]) + DIV_4(f[-1]) + DIV_2(f2[0]) + adj_tl;
- of[1]=DIV_4(f[2]) + DIV_4(f[0]) + DIV_2(f2[1]) +adj_tl;
- of[2]=DIV_4(f[3]) + DIV_4(f[1]) + DIV_2(f2[2]) + adj_tl;
- of[3]=DIV_4(f[4]) + DIV_4(f[2]) + DIV_2(f2[3]) + adj_tl;
- f+=4;
- f2+=4;
- of+=4;
- }
- x=(w-2)&3;
- while (x--)
- {
- *of++=DIV_4(f[1]) + DIV_4(f[-1]) + DIV_2(f2[0])+adj_tl;
- f++;
- f2++;
- }
- // top right
- *of++=DIV_2(f[-1])+DIV_2(f2[0])+adj_tl2; f++; f2++;
- }
- // middle block
- {
- int y=outh-at_top-at_bottom;
- int adj_tl1=0,adj_tl2=0;
- unsigned __int64 adj2=0;
- if (roundmode) { adj_tl1=0x02020202; adj_tl2=0x03030303; adj2=0x0303030303030303i64; }
- while (y--)
- {
- int x;
- unsigned int *f2=f+w;
- unsigned int *f3=f-w;
-
- // left edge
- *of++=DIV_2(f[1])+DIV_4(f2[0])+DIV_4(f3[0]) + adj_tl1; f++; f2++; f3++;
- // middle of line
- #ifdef NO_MMX
- x=(w-2)/4;
- if (roundmode)
- {
- while (x--)
- {
- of[0]=DIV_4(f[1]) + DIV_4(f[-1]) + DIV_4(f2[0]) + DIV_4(f3[0]) + 0x03030303;
- of[1]=DIV_4(f[2]) + DIV_4(f[0]) + DIV_4(f2[1]) + DIV_4(f3[1]) + 0x03030303;
- of[2]=DIV_4(f[3]) + DIV_4(f[1]) + DIV_4(f2[2]) + DIV_4(f3[2]) + 0x03030303;
- of[3]=DIV_4(f[4]) + DIV_4(f[2]) + DIV_4(f2[3]) + DIV_4(f3[3]) + 0x03030303;
- f+=4; f2+=4; f3+=4; of+=4;
- }
- }
- else
- {
- while (x--)
- {
- of[0]=DIV_4(f[1]) + DIV_4(f[-1]) + DIV_4(f2[0]) + DIV_4(f3[0]);
- of[1]=DIV_4(f[2]) + DIV_4(f[0]) + DIV_4(f2[1]) + DIV_4(f3[1]);
- of[2]=DIV_4(f[3]) + DIV_4(f[1]) + DIV_4(f2[2]) + DIV_4(f3[2]);
- of[3]=DIV_4(f[4]) + DIV_4(f[2]) + DIV_4(f2[3]) + DIV_4(f3[3]);
- f+=4; f2+=4; f3+=4; of+=4;
- }
- }
- #else
- {
- __asm
- {
- mov ecx, w
- mov edx, ecx
- mov ebx, edx
- neg ebx
- mov esi, f
- mov edi, of
- sub ecx, 2
- shr ecx, 2
- movq mm1, [esi-4]
- align 16
- mmx_heavy_blur_loop:
- movq mm2, [esi+4]
- pxor mm0, mm0
- movq mm5, mm2
- pxor mm7, mm7
- movq mm3, [esi+edx*4]
- pand mm1, mmx_mask2
- movq mm4, [esi+ebx*4]
- pand mm2, mmx_mask2
- pand mm3, mmx_mask2
- pand mm4, mmx_mask2
- psrl mm1, 2
- movq mm6, [esi+12]
- psrl mm2, 2
- psrl mm3, 2
- paddb mm0, mm1
- psrl mm4, 2
- movq mm1, mm6
- paddb mm2, mm3
- paddb mm0, mm4
- movq mm3, [esi+edx*4+8]
- paddb mm0, mm2
- movq mm4, [esi+ebx*4+8]
- paddb mm0, [adj2]
- pand mm6, mmx_mask2
- movq [edi],mm0
- pand mm5, mmx_mask2
- pand mm3, mmx_mask2
- add esi, 16
- psrl mm6, 2
- pand mm4, mmx_mask2
- psrl mm5, 2
- paddb mm7, mm6
- psrl mm3, 2
- add edi, 16
- psrl mm4, 2
- paddb mm5, mm3
- paddb mm7, mm4
- paddb mm7, mm5
- paddb mm7, [adj2]
- movq [edi-8],mm7
-
- dec ecx
- jnz mmx_heavy_blur_loop
- mov of, edi
- mov f, esi
- };
- f2=f+w; // update these bitches
- f3=f-w;
- }
- #endif
- x=(w-2)&3;
- while (x--)
- {
- *of++=DIV_4(f[1]) + DIV_4(f[-1]) + DIV_4(f2[0]) + DIV_4(f3[0]) + adj_tl2;
- f++;
- f2++;
- f3++;
- }
- // right block
- *of++=DIV_2(f[-1])+DIV_4(f2[0])+DIV_4(f3[0]) + adj_tl1; f++;
- }
- }
- // bottom block
- if (at_bottom)
- {
- unsigned int *f2=f-w;
- int x;
- int adj_tl=0, adj_tl2=0;
- if (roundmode) { adj_tl = 0x02020202; adj_tl2 = 0x01010101; }
- // bottom left
- *of++=DIV_2(f[1])+DIV_2(f2[0]) + adj_tl2; f++; f2++;
- // bottom center
- x=(w-2)/4;
- while (x--)
- {
- of[0]=DIV_4(f[1]) + DIV_4(f[-1]) + DIV_2(f2[0])+adj_tl;
- of[1]=DIV_4(f[2]) + DIV_4(f[0]) + DIV_2(f2[1])+adj_tl;
- of[2]=DIV_4(f[3]) + DIV_4(f[1]) + DIV_2(f2[2])+adj_tl;
- of[3]=DIV_4(f[4]) + DIV_4(f[2]) + DIV_2(f2[3])+adj_tl;
- f+=4;
- f2+=4;
- of+=4;
- }
- x=(w-2)&3;
- while (x--)
- {
- *of++=DIV_4(f[1]) + DIV_4(f[-1]) + DIV_2(f2[0])+adj_tl;
- f++;
- f2++;
- }
- // bottom right
- *of++=DIV_2(f[-1])+DIV_2(f2[0])+adj_tl2; f++; f2++;
- }
- }
- else
- {
- // top line
- if (at_top)
- {
- unsigned int *f2=f+w;
- int x;
- int adj_tl=0, adj_tl2=0;
- if (roundmode) { adj_tl = 0x02020202; adj_tl2 = 0x03030303; }
- // top left
- *of++=DIV_2(f[0])+DIV_4(f[1])+DIV_4(f2[0]) + adj_tl; f++; f2++;
- // top center
- x=(w-2)/4;
- while (x--)
- {
- of[0]=DIV_4(f[0]) + DIV_4(f[1]) + DIV_4(f[-1]) + DIV_4(f2[0]) + adj_tl2;
- of[1]=DIV_4(f[1]) + DIV_4(f[2]) + DIV_4(f[0]) + DIV_4(f2[1]) + adj_tl2;
- of[2]=DIV_4(f[2]) + DIV_4(f[3]) + DIV_4(f[1]) + DIV_4(f2[2]) + adj_tl2;
- of[3]=DIV_4(f[3]) + DIV_4(f[4]) + DIV_4(f[2]) + DIV_4(f2[3]) + adj_tl2;
- f+=4;
- f2+=4;
- of+=4;
- }
- x=(w-2)&3;
- while (x--)
- {
- *of++=DIV_4(f[0]) + DIV_4(f[1]) + DIV_4(f[-1]) + DIV_4(f2[0]) + adj_tl2;
- f++;
- f2++;
- }
- // top right
- *of++=DIV_2(f[0])+DIV_4(f[-1])+DIV_4(f2[0]) + adj_tl; f++; f2++;
- }
- // middle block
- {
- int y=outh-at_top-at_bottom;
- int adj_tl1=0,adj_tl2=0;
- unsigned __int64 adj2=0;
- if (roundmode) { adj_tl1=0x03030303; adj_tl2=0x04040404; adj2=0x0404040404040404i64; }
- while (y--)
- {
- int x;
- unsigned int *f2=f+w;
- unsigned int *f3=f-w;
-
- // left edge
- *of++=DIV_4(f[0])+DIV_4(f[1])+DIV_4(f2[0])+DIV_4(f3[0])+adj_tl1; f++; f2++; f3++;
- // middle of line
- #ifdef NO_MMX
- x=(w-2)/4;
- if (roundmode)
- {
- while (x--)
- {
- of[0]=DIV_2(f[0]) + DIV_8(f[1]) + DIV_8(f[-1]) + DIV_8(f2[0]) + DIV_8(f3[0]) + 0x04040404;
- of[1]=DIV_2(f[1]) + DIV_8(f[2]) + DIV_8(f[0]) + DIV_8(f2[1]) + DIV_8(f3[1]) + 0x04040404;
- of[2]=DIV_2(f[2]) + DIV_8(f[3]) + DIV_8(f[1]) + DIV_8(f2[2]) + DIV_8(f3[2]) + 0x04040404;
- of[3]=DIV_2(f[3]) + DIV_8(f[4]) + DIV_8(f[2]) + DIV_8(f2[3]) + DIV_8(f3[3]) + 0x04040404;
- f+=4; f2+=4; f3+=4; of+=4;
- }
- }
- else
- {
- while (x--)
- {
- of[0]=DIV_2(f[0]) + DIV_8(f[1]) + DIV_8(f[-1]) + DIV_8(f2[0]) + DIV_8(f3[0]);
- of[1]=DIV_2(f[1]) + DIV_8(f[2]) + DIV_8(f[0]) + DIV_8(f2[1]) + DIV_8(f3[1]);
- of[2]=DIV_2(f[2]) + DIV_8(f[3]) + DIV_8(f[1]) + DIV_8(f2[2]) + DIV_8(f3[2]);
- of[3]=DIV_2(f[3]) + DIV_8(f[4]) + DIV_8(f[2]) + DIV_8(f2[3]) + DIV_8(f3[3]);
- f+=4; f2+=4; f3+=4; of+=4;
- }
- }
- #else
- {
- __asm
- {
- mov ecx, w
- mov edx, ecx
- mov ebx, edx
- neg ebx
- mov esi, f
- mov edi, of
- sub ecx, 2
- shr ecx, 2
- movq mm1, [esi-4]
- align 16
- mmx_normal_blur_loop:
- movq mm0, [esi]
- movq mm2, [esi+4]
- pand mm0, mmx_mask1
- movq mm5, mm2
- movq mm7, [esi+8]
- pand mm1, mmx_mask3
- movq mm3, [esi+edx*4]
- pand mm2, mmx_mask3
- movq mm4, [esi+ebx*4]
- pand mm3, mmx_mask3
- psrl mm0, 1
- pand mm4, mmx_mask3
- psrl mm1, 3
- pand mm7, mmx_mask1
- movq mm6, [esi+12]
- psrl mm2, 3
- add esi, 16
- psrl mm3, 3
- paddb mm0, mm1
- psrl mm4, 3
- movq mm1, mm6
- paddb mm2, mm3
- paddb mm0, mm4
- movq mm3, [esi+edx*4-8]
- paddb mm0, mm2
- movq mm4, [esi+ebx*4-8]
- paddb mm0, [adj2]
- pand mm6, mmx_mask3
- movq [edi],mm0
- pand mm5, mmx_mask3
- psrl mm7, 1
- pand mm3, mmx_mask3
- psrl mm6, 3
- pand mm4, mmx_mask3
- psrl mm5, 3
- paddb mm7, mm6
- add edi, 16
- psrl mm3, 3
- psrl mm4, 3
- paddb mm5, mm3
- paddb mm7, mm4
- dec ecx
- paddb mm7, mm5
- paddb mm7, [adj2]
- movq [edi-8],mm7
-
- jnz mmx_normal_blur_loop
- mov of, edi
- mov f, esi
- };
- f2=f+w; // update these bitches
- f3=f-w;
- }
- #endif
- x=(w-2)&3;
- while (x--)
- {
- *of++=DIV_2(f[0]) + DIV_8(f[1]) + DIV_8(f[-1]) + DIV_8(f2[0]) + DIV_8(f3[0]) + adj_tl2;
- f++;
- f2++;
- f3++;
- }
- // right block
- *of++=DIV_4(f[0])+DIV_4(f[-1])+DIV_4(f2[0])+DIV_4(f3[0]) + adj_tl1; f++;
- }
- }
- // bottom block
- if (at_bottom)
- {
- unsigned int *f2=f-w;
- int adj_tl=0, adj_tl2=0;
- if (roundmode) { adj_tl = 0x02020202; adj_tl2 = 0x03030303; }
- int x;
- // bottom left
- *of++=DIV_2(f[0])+DIV_4(f[1])+DIV_4(f2[0]) + adj_tl; f++; f2++;
- // bottom center
- x=(w-2)/4;
- while (x--)
- {
- of[0]=DIV_4(f[0]) + DIV_4(f[1]) + DIV_4(f[-1]) + DIV_4(f2[0]) + adj_tl2;
- of[1]=DIV_4(f[1]) + DIV_4(f[2]) + DIV_4(f[0]) + DIV_4(f2[1]) + adj_tl2;
- of[2]=DIV_4(f[2]) + DIV_4(f[3]) + DIV_4(f[1]) + DIV_4(f2[2]) + adj_tl2;
- of[3]=DIV_4(f[3]) + DIV_4(f[4]) + DIV_4(f[2]) + DIV_4(f2[3]) + adj_tl2;
- f+=4;
- f2+=4;
- of+=4;
- }
- x=(w-2)&3;
- while (x--)
- {
- *of++=DIV_4(f[0]) + DIV_4(f[1]) + DIV_4(f[-1]) + DIV_4(f2[0]) + adj_tl2;
- f++;
- f2++;
- }
- // bottom right
- *of++=DIV_2(f[0])+DIV_4(f[-1])+DIV_4(f2[0]) + adj_tl; f++; f2++;
- }
- }
- #ifndef NO_MMX
- __asm emms;
- #endif
-
- timingLeave(0);
- }
- int C_THISCLASS::smp_begin(int max_threads, char visdata[2][2][576], int isBeat, int *framebuffer, int *fbout, int w, int h)
- {
- if (!enabled) return 0;
- return max_threads;
- }
- int C_THISCLASS::smp_finish(char visdata[2][2][576], int isBeat, int *framebuffer, int *fbout, int w, int h) // return value is that of render() for fbstuff etc
- {
- return !!enabled;
- }
- int C_THISCLASS::render(char visdata[2][2][576], int isBeat, int *framebuffer, int *fbout, int w, int h)
- {
- smp_begin(1,visdata,isBeat,framebuffer,fbout,w,h);
- if (isBeat & 0x80000000) return 0;
- smp_render(0,1,visdata,isBeat,framebuffer,fbout,w,h);
- return smp_finish(visdata,isBeat,framebuffer,fbout,w,h);
- }
- C_RBASE *R_Blur(char *desc)
- {
- if (desc) { strcpy(desc,MOD_NAME); return NULL; }
- return (C_RBASE *) new C_THISCLASS();
- }
- static C_THISCLASS *g_this;
- static BOOL CALLBACK g_DlgProc(HWND hwndDlg, UINT uMsg, WPARAM wParam,LPARAM lParam)
- {
- switch (uMsg)
- {
- case WM_INITDIALOG:
- if (g_this->enabled==2) CheckDlgButton(hwndDlg,IDC_RADIO3,BST_CHECKED);
- else if (g_this->enabled==3) CheckDlgButton(hwndDlg,IDC_RADIO4,BST_CHECKED);
- else if (g_this->enabled) CheckDlgButton(hwndDlg,IDC_RADIO2,BST_CHECKED);
- else CheckDlgButton(hwndDlg,IDC_RADIO1,BST_CHECKED);
- if (g_this->roundmode==0) CheckDlgButton(hwndDlg,IDC_ROUNDDOWN,BST_CHECKED);
- else CheckDlgButton(hwndDlg,IDC_ROUNDUP,BST_CHECKED);
- return 1;
- case WM_COMMAND:
- if (LOWORD(wParam) == IDC_RADIO1)
- if (IsDlgButtonChecked(hwndDlg,IDC_RADIO1))
- g_this->enabled=0;
- if (LOWORD(wParam) == IDC_RADIO2)
- if (IsDlgButtonChecked(hwndDlg,IDC_RADIO2))
- g_this->enabled=1;
- if (LOWORD(wParam) == IDC_RADIO3)
- if (IsDlgButtonChecked(hwndDlg,IDC_RADIO3))
- g_this->enabled=2;
- if (LOWORD(wParam) == IDC_RADIO4)
- if (IsDlgButtonChecked(hwndDlg,IDC_RADIO4))
- g_this->enabled=3;
- if (LOWORD(wParam) == IDC_ROUNDUP)
- if (IsDlgButtonChecked(hwndDlg,IDC_ROUNDUP))
- g_this->roundmode=1;
- if (LOWORD(wParam) == IDC_ROUNDDOWN)
- if (IsDlgButtonChecked(hwndDlg,IDC_ROUNDDOWN))
- g_this->roundmode=0;
- return 0;
- return 0;
- }
- return 0;
- }
- HWND C_THISCLASS::conf(HINSTANCE hInstance, HWND hwndParent)
- {
- g_this = this;
- return WASABI_API_CREATEDIALOG(IDD_CFG_BLUR,hwndParent,g_DlgProc);
- }
- #else
- C_RBASE *R_Blur(char *desc) { return NULL; }
- #endif
|