// xine-lib 1.2.11
// greedyhmacros.h
//
// Copyright (c) 2001 Tom Barry. All rights reserved.
//
// This file is subject to the terms of the GNU General Public License as
// published by the Free Software Foundation. A copy of this license is
// included with this software distribution in the file COPYING. If you
// do not have a copy, you may obtain a copy by writing to the Free
// Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA.
//
// This software is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU General Public License for more details
//

// Define a few macros for CPU dependent instructions.
// I suspect I don't really understand how the C macro preprocessor works but
// this seems to get the job done. // TRB 7/01

// BEFORE USING THESE YOU MUST SET:

// #define SSE_TYPE SSE (or MMX or 3DNOW)

// Macros for the pavgb instruction (packed unsigned byte average).
//
// V_PAVGB(mmr1, mmr2, mmrw, smask)
//   Expands to a string-literal fragment of AT&T-syntax inline assembly that
//   averages the bytes of mmr2 into mmr1. Every argument must itself be a
//   string literal naming an operand, because the pieces are joined by
//   adjacent-literal concatenation.
//     mmr1  - destination; overwritten with the result
//     mmr2  - second source
//     mmrw  - work register, written only by the MMX variant;
//             mmr2 may = mmrw if you can trash it
//     smask - mask ANDed into both inputs before the shift (MMX variant only)
//
// SSE_TYPE must be defined as SSE, MMX or 3DNOW wherever V_PAVGB is expanded.

// MMX fallback: halve each masked input with a word-wide shift, then add
// with unsigned saturation. The mask is what keeps the word shift from
// moving a bit across a byte boundary.
// NOTE(review): smask is presumably 0xFE in every byte - confirm at the
// call site. With that mask the result is (a >> 1) + (b >> 1), which can be
// one lower than the rounded average the pavgb instruction produces.
#define V_PAVGB_MMX(mmr1, mmr2, mmrw, smask) \
    "movq " mmr2 ", " mmrw "\n\t"            \
    "pand " smask ", " mmrw "\n\t"           \
    "psrlw $1, " mmrw "\n\t"                 \
    "pand " smask ", " mmr1 "\n\t"           \
    "psrlw $1, " mmr1 "\n\t"                 \
    "paddusb " mmrw ", " mmr1 "\n\t"

// SSE has the instruction natively; mmrw and smask are ignored.
#define V_PAVGB_SSE(mmr1, mmr2, mmrw, smask) \
    "pavgb " mmr2 ", " mmr1 "\n\t"

// 3DNow! uses its own pavgusb instruction; mmrw and smask are ignored.
#define V_PAVGB_3DNOW(mmr1, mmr2, mmrw, smask) \
    "pavgusb " mmr2 ", " mmr1 "\n\t"

// Dispatch on SSE_TYPE. The extra V_PAVGB2 hop is required: an argument
// sitting next to ## is not macro-expanded, so SSE_TYPE has to be expanded
// by one plain macro call before V_PAVGB3 pastes it onto V_PAVGB_.
#define V_PAVGB(mmr1, mmr2, mmrw, smask) \
    V_PAVGB2(mmr1, mmr2, mmrw, smask, SSE_TYPE)
#define V_PAVGB2(mmr1, mmr2, mmrw, smask, ssetyp) \
    V_PAVGB3(mmr1, mmr2, mmrw, smask, ssetyp)
#define V_PAVGB3(mmr1, mmr2, mmrw, smask, ssetyp) \
    V_PAVGB_##ssetyp(mmr1, mmr2, mmrw, smask)

// Macros for the pmaxub instruction (packed unsigned byte maximum).
//
// V_PMAXUB(mmr1, mmr2)
//   Expands to a string-literal fragment of inline assembly that leaves the
//   byte-wise unsigned maximum of mmr1 and mmr2 in mmr1. Both arguments must
//   be string literals naming operands. mmr2 is not modified.
//
// SSE_TYPE must be defined as SSE, MMX or 3DNOW wherever V_PMAXUB is expanded.

// MMX fallback: the saturating subtract leaves max(mmr1 - mmr2, 0);
// adding mmr2 back then yields max(mmr1, mmr2) in every byte.
#define V_PMAXUB_MMX(mmr1, mmr2)      \
    "psubusb " mmr2 ", " mmr1 "\n\t"  \
    "paddusb " mmr2 ", " mmr1 "\n\t"

// SSE has the instruction natively.
#define V_PMAXUB_SSE(mmr1, mmr2) \
    "pmaxub " mmr2 ", " mmr1 "\n\t"

// 3DNow! has no dedicated form here: use the MMX version.
#define V_PMAXUB_3DNOW(mmr1, mmr2) V_PMAXUB_MMX(mmr1, mmr2)

// Dispatch on SSE_TYPE. V_PMAXUB2 exists so that SSE_TYPE is macro-expanded
// before V_PMAXUB3 pastes it onto V_PMAXUB_ (operands of ## are not expanded).
#define V_PMAXUB(mmr1, mmr2)          V_PMAXUB2(mmr1, mmr2, SSE_TYPE)
#define V_PMAXUB2(mmr1, mmr2, ssetyp) V_PMAXUB3(mmr1, mmr2, ssetyp)
#define V_PMAXUB3(mmr1, mmr2, ssetyp) V_PMAXUB_##ssetyp(mmr1, mmr2)

// Macros for the pminub instruction (packed unsigned byte minimum).
//
// V_PMINUB(mmr1, mmr2, mmrw)
//   Expands to a string-literal fragment of inline assembly that leaves the
//   byte-wise unsigned minimum of mmr1 and mmr2 in mmr1. All arguments must
//   be string literals naming operands.
//     mmr1 - destination; overwritten with the result
//     mmr2 - second source
//     mmrw - work register, written only by the MMX/3DNOW variants;
//            mmr2 may NOT = mmrw
//
// SSE_TYPE must be defined as SSE, MMX or 3DNOW wherever V_PMINUB is expanded.

// MMX fallback, per byte:
//   mmrw = 0xFF                      (pcmpeqb of a register with itself)
//   mmrw = 0xFF - mmr2
//   mmr1 = sat(mmr1 + mmrw)          -> 0xFF wherever mmr1 >= mmr2
//   mmr1 = sat(mmr1 - mmrw)          -> mmr2 where it saturated, else mmr1
// mmrw is overwritten before mmr2 is read, which is why the two must differ.
#define V_PMINUB_MMX(mmr1, mmr2, mmrw) \
    "pcmpeqb " mmrw ", " mmrw "\n\t"   \
    "psubusb " mmr2 ", " mmrw "\n\t"   \
    "paddusb " mmrw ", " mmr1 "\n\t"   \
    "psubusb " mmrw ", " mmr1 "\n\t"

// SSE has the instruction natively; mmrw is ignored.
#define V_PMINUB_SSE(mmr1, mmr2, mmrw) \
    "pminub " mmr2 ", " mmr1 "\n\t"

// 3DNow! has no dedicated form here: use the MMX version.
#define V_PMINUB_3DNOW(mmr1, mmr2, mmrw) V_PMINUB_MMX(mmr1, mmr2, mmrw)

// Dispatch on SSE_TYPE. V_PMINUB2 exists so that SSE_TYPE is macro-expanded
// before V_PMINUB3 pastes it onto V_PMINUB_ (operands of ## are not expanded).
#define V_PMINUB(mmr1, mmr2, mmrw)          V_PMINUB2(mmr1, mmr2, mmrw, SSE_TYPE)
#define V_PMINUB2(mmr1, mmr2, mmrw, ssetyp) V_PMINUB3(mmr1, mmr2, mmrw, ssetyp)
#define V_PMINUB3(mmr1, mmr2, mmrw, ssetyp) V_PMINUB_##ssetyp(mmr1, mmr2, mmrw)

// Macros for the movntq instruction (64-bit store).
//
// V_MOVNTQ(mmr1, mmr2)
//   Expands to a string-literal fragment of inline assembly that stores mmr2
//   to mmr1. Note the order: mmr1 is the destination and mmr2 the source;
//   they are emitted as "op mmr2, mmr1" (AT&T operand order). Both arguments
//   must be string literals naming operands.
//
// Only the SSE variant emits movntq; MMX and 3DNOW fall back to a plain movq.
// None of the variants emits a fence after the store.
//
// SSE_TYPE must be defined as SSE, MMX or 3DNOW wherever V_MOVNTQ is expanded.
#define V_MOVNTQ_MMX(mmr1, mmr2)   "movq " mmr2 ", " mmr1 "\n\t"
#define V_MOVNTQ_3DNOW(mmr1, mmr2) "movq " mmr2 ", " mmr1 "\n\t"
#define V_MOVNTQ_SSE(mmr1, mmr2)   "movntq " mmr2 ", " mmr1 "\n\t"

// Dispatch on SSE_TYPE. V_MOVNTQ2 exists so that SSE_TYPE is macro-expanded
// before V_MOVNTQ3 pastes it onto V_MOVNTQ_ (operands of ## are not expanded).
#define V_MOVNTQ(mmr1, mmr2)          V_MOVNTQ2(mmr1, mmr2, SSE_TYPE)
#define V_MOVNTQ2(mmr1, mmr2, ssetyp) V_MOVNTQ3(mmr1, mmr2, ssetyp)
#define V_MOVNTQ3(mmr1, mmr2, ssetyp) V_MOVNTQ_##ssetyp(mmr1, mmr2)

// end of macros