frsh: Export information about the last RTP contract and VRES

[frescor/ffmpeg.git] / libpostproc / postprocess_template.c
diff --git a/libpostproc/postprocess_template.c b/libpostproc/postprocess_template.c

index b03386e5cf2095e9744bd9d65c28d07c6cdad92b..6879dba8c1db71229281d7c63562be8e0bb0f1d0 100644 (file)
--- a/libpostproc/postprocess_template.c
+++ b/libpostproc/postprocess_template.c
@@ -19,7 +19,7 @@
   */
  
  /**
- * @file postprocess_template.c
+ * @file libpostproc/postprocess_template.c
   * mmx/mmx2/3dnow postprocess code.
   */
  
@@ -31,45 +31,45 @@
  #undef PMINUB
  #undef PMAXUB
  
-#ifdef HAVE_MMX2
+#if   HAVE_MMX2
  #define REAL_PAVGB(a,b) "pavgb " #a ", " #b " \n\t"
-#elif defined (HAVE_3DNOW)
+#elif HAVE_AMD3DNOW
  #define REAL_PAVGB(a,b) "pavgusb " #a ", " #b " \n\t"
  #endif
  #define PAVGB(a,b)  REAL_PAVGB(a,b)
  
-#ifdef HAVE_MMX2
+#if   HAVE_MMX2
  #define PMINUB(a,b,t) "pminub " #a ", " #b " \n\t"
-#elif defined (HAVE_MMX)
+#elif HAVE_MMX
  #define PMINUB(b,a,t) \
      "movq " #a ", " #t " \n\t"\
      "psubusb " #b ", " #t " \n\t"\
      "psubb " #t ", " #a " \n\t"
  #endif
  
-#ifdef HAVE_MMX2
+#if   HAVE_MMX2
  #define PMAXUB(a,b) "pmaxub " #a ", " #b " \n\t"
-#elif defined (HAVE_MMX)
+#elif HAVE_MMX
  #define PMAXUB(a,b) \
      "psubusb " #a ", " #b " \n\t"\
      "paddb " #a ", " #b " \n\t"
  #endif
  
  //FIXME? |255-0| = 1 (should not be a problem ...)
-#ifdef HAVE_MMX
+#if HAVE_MMX
  /**
   * Check if the middle 8x8 Block in the given 8x16 block is flat
   */
  static inline int RENAME(vertClassify)(uint8_t src[], int stride, PPContext *c){
      int numEq= 0, dcOk;
      src+= stride*4; // src points to begin of the 8x8 Block
-    asm volatile(
+    __asm__ volatile(
          "movq %0, %%mm7                         \n\t"
          "movq %1, %%mm6                         \n\t"
          : : "m" (c->mmxDcOffset[c->nonBQP]),  "m" (c->mmxDcThreshold[c->nonBQP])
          );
  
-    asm volatile(
+    __asm__ volatile(
          "lea (%2, %3), %%"REG_a"                \n\t"
  //      0       1       2       3       4       5       6       7       8       9
  //      %1      eax     eax+%2  eax+2%2 %1+4%2  ecx     ecx+%2  ecx+2%2 %1+8%2  ecx+4%2
@@ -136,7 +136,7 @@ static inline int RENAME(vertClassify)(uint8_t src[], int stride, PPContext *c){
          "psubusb %%mm3, %%mm4                   \n\t"
  
          "                                       \n\t"
-#ifdef HAVE_MMX2
+#if HAVE_MMX2
          "pxor %%mm7, %%mm7                      \n\t"
          "psadbw %%mm7, %%mm0                    \n\t"
  #else
@@ -158,7 +158,7 @@ static inline int RENAME(vertClassify)(uint8_t src[], int stride, PPContext *c){
          "movd %%mm4, %1                         \n\t"
  
          : "=r" (numEq), "=r" (dcOk)
-        : "r" (src), "r" ((long)stride), "m" (c->pQPb)
+        : "r" (src), "r" ((x86_reg)stride), "m" (c->pQPb)
          : "%"REG_a
          );
  
@@ -176,12 +176,12 @@ static inline int RENAME(vertClassify)(uint8_t src[], int stride, PPContext *c){
   * Do a vertical low pass filter on the 8x16 block (only write to the 8x8 block in the middle)
   * using the 9-Tap Filter (1,1,2,2,4,2,2,1,1)/16
   */
-#ifndef HAVE_ALTIVEC
+#if !HAVE_ALTIVEC
  static inline void RENAME(doVertLowPass)(uint8_t *src, int stride, PPContext *c)
  {
-#if defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#if HAVE_MMX2 || HAVE_AMD3DNOW
      src+= stride*3;
-    asm volatile(        //"movv %0 %1 %2\n\t"
+    __asm__ volatile(        //"movv %0 %1 %2\n\t"
          "movq %2, %%mm0                         \n\t"  // QP,..., QP
          "pxor %%mm4, %%mm4                      \n\t"
  
@@ -303,10 +303,10 @@ static inline void RENAME(doVertLowPass)(uint8_t *src, int stride, PPContext *c)
          "sub %1, %0                             \n\t"
  
          :
-        : "r" (src), "r" ((long)stride), "m" (c->pQPb)
+        : "r" (src), "r" ((x86_reg)stride), "m" (c->pQPb)
          : "%"REG_a, "%"REG_c
      );
-#else //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#else //HAVE_MMX2 || HAVE_AMD3DNOW
      const int l1= stride;
      const int l2= stride + l1;
      const int l3= stride + l2;
@@ -345,7 +345,7 @@ static inline void RENAME(doVertLowPass)(uint8_t *src, int stride, PPContext *c)
  
          src++;
      }
-#endif //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#endif //HAVE_MMX2 || HAVE_AMD3DNOW
  }
  #endif //HAVE_ALTIVEC
  
@@ -364,10 +364,10 @@ static inline void RENAME(doVertLowPass)(uint8_t *src, int stride, PPContext *c)
   */
  static inline void RENAME(vertRK1Filter)(uint8_t *src, int stride, int QP)
  {
-#if defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#if HAVE_MMX2 || HAVE_AMD3DNOW
      src+= stride*3;
  // FIXME rounding
-    asm volatile(
+    __asm__ volatile(
          "pxor %%mm7, %%mm7                      \n\t" // 0
          "movq "MANGLE(b80)", %%mm6              \n\t" // MIN_SIGNED_BYTE
          "leal (%0, %1), %%"REG_a"               \n\t"
@@ -423,10 +423,10 @@ static inline void RENAME(vertRK1Filter)(uint8_t *src, int stride, int QP)
          "movq %%mm2, (%%"REG_c", %1)            \n\t"
  
          :
-        : "r" (src), "r" ((long)stride)
+        : "r" (src), "r" ((x86_reg)stride)
          : "%"REG_a, "%"REG_c
      );
-#else //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#else //HAVE_MMX2 || HAVE_AMD3DNOW
      const int l1= stride;
      const int l2= stride + l1;
      const int l3= stride + l2;
@@ -449,7 +449,7 @@ static inline void RENAME(vertRK1Filter)(uint8_t *src, int stride, int QP)
          }
      }
  
-#endif //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#endif //HAVE_MMX2 || HAVE_AMD3DNOW
  }
  #endif //0
  
@@ -462,10 +462,10 @@ static inline void RENAME(vertRK1Filter)(uint8_t *src, int stride, int QP)
   */
  static inline void RENAME(vertX1Filter)(uint8_t *src, int stride, PPContext *co)
  {
-#if defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#if HAVE_MMX2 || HAVE_AMD3DNOW
      src+= stride*3;
  
-    asm volatile(
+    __asm__ volatile(
          "pxor %%mm7, %%mm7                      \n\t" // 0
          "lea (%0, %1), %%"REG_a"                \n\t"
          "lea (%%"REG_a", %1, 4), %%"REG_c"      \n\t"
@@ -545,10 +545,10 @@ static inline void RENAME(vertX1Filter)(uint8_t *src, int stride, PPContext *co)
          "movq %%mm0, (%%"REG_c", %1, 2)         \n\t" // line 7
  
          :
-        : "r" (src), "r" ((long)stride), "m" (co->pQPb)
+        : "r" (src), "r" ((x86_reg)stride), "m" (co->pQPb)
          : "%"REG_a, "%"REG_c
      );
-#else //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#else //HAVE_MMX2 || HAVE_AMD3DNOW
  
      const int l1= stride;
      const int l2= stride + l1;
@@ -582,13 +582,13 @@ static inline void RENAME(vertX1Filter)(uint8_t *src, int stride, PPContext *co)
          }
          src++;
      }
-#endif //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#endif //HAVE_MMX2 || HAVE_AMD3DNOW
  }
  
-#ifndef HAVE_ALTIVEC
+#if !HAVE_ALTIVEC
  static inline void RENAME(doVertDefFilter)(uint8_t src[], int stride, PPContext *c)
  {
-#if defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#if HAVE_MMX2 || HAVE_AMD3DNOW
  /*
      uint8_t tmp[16];
      const int l1= stride;
@@ -604,7 +604,7 @@ static inline void RENAME(doVertDefFilter)(uint8_t src[], int stride, PPContext
      memcpy(tmp+8, src+stride*8, 8);
  */
      src+= stride*4;
-    asm volatile(
+    __asm__ volatile(
  
  #if 0 //slightly more accurate and slightly slower
          "pxor %%mm7, %%mm7                      \n\t" // 0
@@ -810,7 +810,7 @@ static inline void RENAME(doVertDefFilter)(uint8_t src[], int stride, PPContext
          "movq %%mm2, (%0, %1, 4)                \n\t"
  
          :
-        : "r" (src), "r" ((long)stride), "m" (c->pQPb)
+        : "r" (src), "r" ((x86_reg)stride), "m" (c->pQPb)
          : "%"REG_a, "%"REG_c
      );
  
@@ -869,9 +869,9 @@ static inline void RENAME(doVertDefFilter)(uint8_t src[], int stride, PPContext
      }
  }
  */
-#elif defined (HAVE_MMX)
+#elif HAVE_MMX
      src+= stride*4;
-    asm volatile(
+    __asm__ volatile(
          "pxor %%mm7, %%mm7                      \n\t"
          "lea -40(%%"REG_SP"), %%"REG_c"         \n\t" // make space for 4 8-byte vars
          "and "ALIGN_MASK", %%"REG_c"            \n\t" // align
@@ -978,7 +978,7 @@ static inline void RENAME(doVertDefFilter)(uint8_t src[], int stride, PPContext
          "movq (%%"REG_c"), %%mm2                \n\t" // 2L0 - 5L1 + 5L2 - 2L3
          "movq 8(%%"REG_c"), %%mm3               \n\t" // 2H0 - 5H1 + 5H2 - 2H3
  
-#ifdef HAVE_MMX2
+#if HAVE_MMX2
          "movq %%mm7, %%mm6                      \n\t" // 0
          "psubw %%mm0, %%mm6                     \n\t"
          "pmaxsw %%mm6, %%mm0                    \n\t" // |2L4 - 5L5 + 5L6 - 2L7|
@@ -1010,7 +1010,7 @@ static inline void RENAME(doVertDefFilter)(uint8_t src[], int stride, PPContext
          "psubw %%mm6, %%mm3                     \n\t" // |2H0 - 5H1 + 5H2 - 2H3|
  #endif
  
-#ifdef HAVE_MMX2
+#if HAVE_MMX2
          "pminsw %%mm2, %%mm0                    \n\t"
          "pminsw %%mm3, %%mm1                    \n\t"
  #else
@@ -1074,7 +1074,7 @@ static inline void RENAME(doVertDefFilter)(uint8_t src[], int stride, PPContext
          "pand %%mm2, %%mm4                      \n\t"
          "pand %%mm3, %%mm5                      \n\t"
  
-#ifdef HAVE_MMX2
+#if HAVE_MMX2
          "pminsw %%mm0, %%mm4                    \n\t"
          "pminsw %%mm1, %%mm5                    \n\t"
  #else
@@ -1098,10 +1098,10 @@ static inline void RENAME(doVertDefFilter)(uint8_t src[], int stride, PPContext
          "movq %%mm0, (%0, %1)                   \n\t"
  
          : "+r" (src)
-        : "r" ((long)stride), "m" (c->pQPb)
+        : "r" ((x86_reg)stride), "m" (c->pQPb)
          : "%"REG_a, "%"REG_c
      );
-#else //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#else //HAVE_MMX2 || HAVE_AMD3DNOW
      const int l1= stride;
      const int l2= stride + l1;
      const int l3= stride + l2;
@@ -1139,15 +1139,15 @@ static inline void RENAME(doVertDefFilter)(uint8_t src[], int stride, PPContext
          }
          src++;
      }
-#endif //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#endif //HAVE_MMX2 || HAVE_AMD3DNOW
  }
  #endif //HAVE_ALTIVEC
  
-#ifndef HAVE_ALTIVEC
+#if !HAVE_ALTIVEC
  static inline void RENAME(dering)(uint8_t src[], int stride, PPContext *c)
  {
-#if defined (HAVE_MMX2) || defined (HAVE_3DNOW)
-    asm volatile(
+#if HAVE_MMX2 || HAVE_AMD3DNOW
+    __asm__ volatile(
          "pxor %%mm6, %%mm6                      \n\t"
          "pcmpeqb %%mm7, %%mm7                   \n\t"
          "movq %2, %%mm0                         \n\t"
@@ -1164,7 +1164,7 @@ static inline void RENAME(dering)(uint8_t src[], int stride, PPContext *c)
  //        %0        eax        eax+%1        eax+2%1        %0+4%1        edx        edx+%1        edx+2%1        %0+8%1        edx+4%1
  
  #undef FIND_MIN_MAX
-#ifdef HAVE_MMX2
+#if HAVE_MMX2
  #define REAL_FIND_MIN_MAX(addr)\
          "movq " #addr ", %%mm0                  \n\t"\
          "pminub %%mm0, %%mm7                    \n\t"\
@@ -1191,7 +1191,7 @@ FIND_MIN_MAX((%0, %1, 8))
  
          "movq %%mm7, %%mm4                      \n\t"
          "psrlq $8, %%mm7                        \n\t"
-#ifdef HAVE_MMX2
+#if HAVE_MMX2
          "pminub %%mm4, %%mm7                    \n\t" // min of pixels
          "pshufw $0xF9, %%mm7, %%mm4             \n\t"
          "pminub %%mm4, %%mm7                    \n\t" // min of pixels
@@ -1216,7 +1216,7 @@ FIND_MIN_MAX((%0, %1, 8))
  
          "movq %%mm6, %%mm4                      \n\t"
          "psrlq $8, %%mm6                        \n\t"
-#ifdef HAVE_MMX2
+#if HAVE_MMX2
          "pmaxub %%mm4, %%mm6                    \n\t" // max of pixels
          "pshufw $0xF9, %%mm6, %%mm4             \n\t"
          "pmaxub %%mm4, %%mm6                    \n\t"
@@ -1367,10 +1367,10 @@ DERING_CORE((%%REGd, %1, 2),(%0, %1, 8)    ,%%mm0,%%mm2,%%mm4,%%mm1,%%mm3,%%mm5,
  DERING_CORE((%0, %1, 8)    ,(%%REGd, %1, 4),%%mm2,%%mm4,%%mm0,%%mm3,%%mm5,%%mm1,%%mm6,%%mm7)
  
          "1:                        \n\t"
-        : : "r" (src), "r" ((long)stride), "m" (c->pQPb), "m"(c->pQPb2)
+        : : "r" (src), "r" ((x86_reg)stride), "m" (c->pQPb), "m"(c->pQPb2)
          : "%"REG_a, "%"REG_d, "%"REG_c
      );
-#else //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#else //HAVE_MMX2 || HAVE_AMD3DNOW
      int y;
      int min=255;
      int max=0;
@@ -1431,7 +1431,7 @@ DERING_CORE((%0, %1, 8)    ,(%%REGd, %1, 4),%%mm2,%%mm4,%%mm0,%%mm3,%%mm5,%%mm1,
                  f= (f + 8)>>4;
  
  #ifdef DEBUG_DERING_THRESHOLD
-                    asm volatile("emms\n\t":);
+                    __asm__ volatile("emms\n\t":);
                      {
                      static long long numPixels=0;
                      if(x!=1 && x!=8 && y!=1 && y!=8) numPixels++;
@@ -1487,7 +1487,7 @@ DERING_CORE((%0, %1, 8)    ,(%%REGd, %1, 4),%%mm2,%%mm4,%%mm0,%%mm3,%%mm5,%%mm1,
  //        src[0] = src[7]=src[stride*7]=src[stride*7 + 7]=255;
      }
  #endif
-#endif //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#endif //HAVE_MMX2 || HAVE_AMD3DNOW
  }
  #endif //HAVE_ALTIVEC
  
@@ -1499,9 +1499,9 @@ DERING_CORE((%0, %1, 8)    ,(%%REGd, %1, 4),%%mm2,%%mm4,%%mm0,%%mm3,%%mm5,%%mm1,
   */
  static inline void RENAME(deInterlaceInterpolateLinear)(uint8_t src[], int stride)
  {
-#if defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#if HAVE_MMX2 || HAVE_AMD3DNOW
      src+= 4*stride;
-    asm volatile(
+    __asm__ volatile(
          "lea (%0, %1), %%"REG_a"                \n\t"
          "lea (%%"REG_a", %1, 4), %%"REG_c"      \n\t"
  //      0       1       2       3       4       5       6       7       8       9
@@ -1521,7 +1521,7 @@ static inline void RENAME(deInterlaceInterpolateLinear)(uint8_t src[], int strid
          PAVGB(%%mm0, %%mm1)
          "movq %%mm1, (%%"REG_c", %1, 2)         \n\t"
  
-        : : "r" (src), "r" ((long)stride)
+        : : "r" (src), "r" ((x86_reg)stride)
          : "%"REG_a, "%"REG_c
      );
  #else
@@ -1552,9 +1552,9 @@ static inline void RENAME(deInterlaceInterpolateLinear)(uint8_t src[], int strid
   */
  static inline void RENAME(deInterlaceInterpolateCubic)(uint8_t src[], int stride)
  {
-#if defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#if HAVE_MMX2 || HAVE_AMD3DNOW
      src+= stride*3;
-    asm volatile(
+    __asm__ volatile(
          "lea (%0, %1), %%"REG_a"                \n\t"
          "lea (%%"REG_a", %1, 4), %%"REG_d"      \n\t"
          "lea (%%"REG_d", %1, 4), %%"REG_c"      \n\t"
@@ -1591,10 +1591,10 @@ DEINT_CUBIC((%%REGa, %1), (%0, %1, 4) , (%%REGd)       , (%%REGd, %1), (%0, %1,
  DEINT_CUBIC((%0, %1, 4) , (%%REGd, %1), (%%REGd, %1, 2), (%0, %1, 8) , (%%REGc))
  DEINT_CUBIC((%%REGd, %1), (%0, %1, 8) , (%%REGd, %1, 4), (%%REGc)    , (%%REGc, %1, 2))
  
-        : : "r" (src), "r" ((long)stride)
+        : : "r" (src), "r" ((x86_reg)stride)
          : "%"REG_a, "%"REG_d, "%"REG_c
      );
-#else //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#else //HAVE_MMX2 || HAVE_AMD3DNOW
      int x;
      src+= stride*3;
      for(x=0; x<8; x++){
@@ -1604,7 +1604,7 @@ DEINT_CUBIC((%%REGd, %1), (%0, %1, 8) , (%%REGd, %1, 4), (%%REGc)    , (%%REGc,
          src[stride*9] = CLIP((-src[stride*6] + 9*src[stride*8] + 9*src[stride*10] - src[stride*12])>>4);
          src++;
      }
-#endif //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#endif //HAVE_MMX2 || HAVE_AMD3DNOW
  }
  
  /**
@@ -1616,9 +1616,9 @@ DEINT_CUBIC((%%REGd, %1), (%0, %1, 8) , (%%REGd, %1, 4), (%%REGc)    , (%%REGc,
   */
  static inline void RENAME(deInterlaceFF)(uint8_t src[], int stride, uint8_t *tmp)
  {
-#if defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#if HAVE_MMX2 || HAVE_AMD3DNOW
      src+= stride*4;
-    asm volatile(
+    __asm__ volatile(
          "lea (%0, %1), %%"REG_a"                \n\t"
          "lea (%%"REG_a", %1, 4), %%"REG_d"      \n\t"
          "pxor %%mm7, %%mm7                      \n\t"
@@ -1662,10 +1662,10 @@ DEINT_FF((%0, %1, 4) , (%%REGd)       , (%%REGd, %1), (%%REGd, %1, 2))
  DEINT_FF((%%REGd, %1), (%%REGd, %1, 2), (%0, %1, 8) , (%%REGd, %1, 4))
  
          "movq %%mm0, (%2)                       \n\t"
-        : : "r" (src), "r" ((long)stride), "r"(tmp)
+        : : "r" (src), "r" ((x86_reg)stride), "r"(tmp)
          : "%"REG_a, "%"REG_d
      );
-#else //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#else //HAVE_MMX2 || HAVE_AMD3DNOW
      int x;
      src+= stride*4;
      for(x=0; x<8; x++){
@@ -1683,7 +1683,7 @@ DEINT_FF((%%REGd, %1), (%%REGd, %1, 2), (%0, %1, 8) , (%%REGd, %1, 4))
  
          src++;
      }
-#endif //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#endif //HAVE_MMX2 || HAVE_AMD3DNOW
  }
  
  /**
@@ -1695,9 +1695,9 @@ DEINT_FF((%%REGd, %1), (%%REGd, %1, 2), (%0, %1, 8) , (%%REGd, %1, 4))
   */
  static inline void RENAME(deInterlaceL5)(uint8_t src[], int stride, uint8_t *tmp, uint8_t *tmp2)
  {
-#if defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#if HAVE_MMX2 || HAVE_AMD3DNOW
      src+= stride*4;
-    asm volatile(
+    __asm__ volatile(
          "lea (%0, %1), %%"REG_a"                \n\t"
          "lea (%%"REG_a", %1, 4), %%"REG_d"      \n\t"
          "pxor %%mm7, %%mm7                      \n\t"
@@ -1752,10 +1752,10 @@ DEINT_L5(%%mm1, %%mm0, (%%REGd, %1, 2), (%0, %1, 8)    , (%%REGd, %1, 4))
  
          "movq %%mm0, (%2)                       \n\t"
          "movq %%mm1, (%3)                       \n\t"
-        : : "r" (src), "r" ((long)stride), "r"(tmp), "r"(tmp2)
+        : : "r" (src), "r" ((x86_reg)stride), "r"(tmp), "r"(tmp2)
          : "%"REG_a, "%"REG_d
      );
-#else //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#else //HAVE_MMX2 || HAVE_AMD3DNOW
      int x;
      src+= stride*4;
      for(x=0; x<8; x++){
@@ -1784,7 +1784,7 @@ DEINT_L5(%%mm1, %%mm0, (%%REGd, %1, 2), (%0, %1, 8)    , (%%REGd, %1, 4))
  
          src++;
      }
-#endif //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#endif //HAVE_MMX2 || HAVE_AMD3DNOW
  }
  
  /**
@@ -1796,9 +1796,9 @@ DEINT_L5(%%mm1, %%mm0, (%%REGd, %1, 2), (%0, %1, 8)    , (%%REGd, %1, 4))
   */
  static inline void RENAME(deInterlaceBlendLinear)(uint8_t src[], int stride, uint8_t *tmp)
  {
-#if defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#if HAVE_MMX2 || HAVE_AMD3DNOW
      src+= 4*stride;
-    asm volatile(
+    __asm__ volatile(
          "lea (%0, %1), %%"REG_a"                \n\t"
          "lea (%%"REG_a", %1, 4), %%"REG_d"      \n\t"
  //      0       1       2       3       4       5       6       7       8       9
@@ -1840,10 +1840,10 @@ static inline void RENAME(deInterlaceBlendLinear)(uint8_t src[], int stride, uin
          "movq %%mm2, (%%"REG_d", %1, 2)         \n\t"
          "movq %%mm1, (%2)                       \n\t"
  
-        : : "r" (src), "r" ((long)stride), "r" (tmp)
+        : : "r" (src), "r" ((x86_reg)stride), "r" (tmp)
          : "%"REG_a, "%"REG_d
      );
-#else //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#else //HAVE_MMX2 || HAVE_AMD3DNOW
      int a, b, c, x;
      src+= 4*stride;
  
@@ -1886,7 +1886,7 @@ static inline void RENAME(deInterlaceBlendLinear)(uint8_t src[], int stride, uin
          src += 4;
          tmp += 4;
      }
-#endif //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#endif //HAVE_MMX2 || HAVE_AMD3DNOW
  }
  
  /**
@@ -1897,10 +1897,10 @@ static inline void RENAME(deInterlaceBlendLinear)(uint8_t src[], int stride, uin
   */
  static inline void RENAME(deInterlaceMedian)(uint8_t src[], int stride)
  {
-#ifdef HAVE_MMX
+#if HAVE_MMX
      src+= 4*stride;
-#ifdef HAVE_MMX2
-    asm volatile(
+#if HAVE_MMX2
+    __asm__ volatile(
          "lea (%0, %1), %%"REG_a"                \n\t"
          "lea (%%"REG_a", %1, 4), %%"REG_d"      \n\t"
  //      0       1       2       3       4       5       6       7       8       9
@@ -1944,12 +1944,12 @@ static inline void RENAME(deInterlaceMedian)(uint8_t src[], int stride)
          "movq %%mm2, (%%"REG_d", %1, 2)         \n\t"
  
  
-        : : "r" (src), "r" ((long)stride)
+        : : "r" (src), "r" ((x86_reg)stride)
          : "%"REG_a, "%"REG_d
      );
  
  #else // MMX without MMX2
-    asm volatile(
+    __asm__ volatile(
          "lea (%0, %1), %%"REG_a"                \n\t"
          "lea (%%"REG_a", %1, 4), %%"REG_d"      \n\t"
  //      0       1       2       3       4       5       6       7       8       9
@@ -1986,7 +1986,7 @@ MEDIAN((%%REGa, %1), (%%REGa, %1, 2), (%0, %1, 4))
  MEDIAN((%0, %1, 4) , (%%REGd)       , (%%REGd, %1))
  MEDIAN((%%REGd, %1), (%%REGd, %1, 2), (%0, %1, 8))
  
-        : : "r" (src), "r" ((long)stride)
+        : : "r" (src), "r" ((x86_reg)stride)
          : "%"REG_a, "%"REG_d
      );
  #endif //HAVE_MMX2
@@ -2012,13 +2012,13 @@ MEDIAN((%%REGd, %1), (%%REGd, %1, 2), (%0, %1, 8))
  #endif //HAVE_MMX
  }
  
-#ifdef HAVE_MMX
+#if HAVE_MMX
  /**
   * transposes and shift the given 8x8 Block into dst1 and dst2
   */
  static inline void RENAME(transpose1)(uint8_t *dst1, uint8_t *dst2, uint8_t *src, int srcStride)
  {
-    asm(
+    __asm__(
          "lea (%0, %1), %%"REG_a"                \n\t"
  //      0       1       2       3       4       5       6       7       8       9
  //      %0      eax     eax+%1  eax+2%1 %0+4%1  edx     edx+%1  edx+2%1 %0+8%1  edx+4%1
@@ -2093,7 +2093,7 @@ static inline void RENAME(transpose1)(uint8_t *dst1, uint8_t *dst2, uint8_t *src
          "movd %%mm1, 116(%3)                    \n\t"
  
  
-        :: "r" (src), "r" ((long)srcStride), "r" (dst1), "r" (dst2)
+        :: "r" (src), "r" ((x86_reg)srcStride), "r" (dst1), "r" (dst2)
          : "%"REG_a
      );
  }
@@ -2103,7 +2103,7 @@ static inline void RENAME(transpose1)(uint8_t *dst1, uint8_t *dst2, uint8_t *src
   */
  static inline void RENAME(transpose2)(uint8_t *dst, int dstStride, uint8_t *src)
  {
-    asm(
+    __asm__(
          "lea (%0, %1), %%"REG_a"                \n\t"
          "lea (%%"REG_a",%1,4), %%"REG_d"        \n\t"
  //      0       1       2       3       4       5       6       7       8       9
@@ -2173,14 +2173,14 @@ static inline void RENAME(transpose2)(uint8_t *dst, int dstStride, uint8_t *src)
          "psrlq $32, %%mm1                       \n\t"
          "movd %%mm1, 4(%%"REG_d", %1, 2)        \n\t"
  
-        :: "r" (dst), "r" ((long)dstStride), "r" (src)
+        :: "r" (dst), "r" ((x86_reg)dstStride), "r" (src)
          : "%"REG_a, "%"REG_d
      );
  }
  #endif //HAVE_MMX
  //static long test=0;
  
-#ifndef HAVE_ALTIVEC
+#if !HAVE_ALTIVEC
  static inline void RENAME(tempNoiseReducer)(uint8_t *src, int stride,
                                      uint8_t *tempBlurred, uint32_t *tempBlurredPast, int *maxNoise)
  {
@@ -2191,8 +2191,8 @@ static inline void RENAME(tempNoiseReducer)(uint8_t *src, int stride,
  
  #define FAST_L2_DIFF
  //#define L1_DIFF //u should change the thresholds too if u try that one
-#if defined (HAVE_MMX2) || defined (HAVE_3DNOW)
-    asm volatile(
+#if HAVE_MMX2 || HAVE_AMD3DNOW
+    __asm__ volatile(
          "lea (%2, %2, 2), %%"REG_a"             \n\t" // 3*stride
          "lea (%2, %2, 4), %%"REG_d"             \n\t" // 5*stride
          "lea (%%"REG_d", %2, 2), %%"REG_c"      \n\t" // 7*stride
@@ -2476,10 +2476,10 @@ L2_DIFF_CORE((%0, %%REGc)  , (%1, %%REGc))
  
          "4:                                     \n\t"
  
-        :: "r" (src), "r" (tempBlurred), "r"((long)stride), "m" (tempBlurredPast)
+        :: "r" (src), "r" (tempBlurred), "r"((x86_reg)stride), "m" (tempBlurredPast)
          : "%"REG_a, "%"REG_d, "%"REG_c, "memory"
      );
-#else //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#else //HAVE_MMX2 || HAVE_AMD3DNOW
  {
      int y;
      int d=0;
@@ -2562,11 +2562,11 @@ Switch between
          }
      }
  }
-#endif //defined (HAVE_MMX2) || defined (HAVE_3DNOW)
+#endif //HAVE_MMX2 || HAVE_AMD3DNOW
  }
  #endif //HAVE_ALTIVEC
  
-#ifdef HAVE_MMX
+#if HAVE_MMX
  /**
   * accurate deblock filter
   */
@@ -2575,13 +2575,13 @@ static av_always_inline void RENAME(do_a_deblock)(uint8_t *src, int step, int st
      int64_t sums[10*8*2];
      src+= step*3; // src points to begin of the 8x8 Block
  //START_TIMER
-    asm volatile(
+    __asm__ volatile(
          "movq %0, %%mm7                         \n\t"
          "movq %1, %%mm6                         \n\t"
          : : "m" (c->mmxDcOffset[c->nonBQP]),  "m" (c->mmxDcThreshold[c->nonBQP])
          );
  
-    asm volatile(
+    __asm__ volatile(
          "lea (%2, %3), %%"REG_a"                \n\t"
  //      0       1       2       3       4       5       6       7       8       9
  //      %1      eax     eax+%2  eax+2%2 %1+4%2  ecx     ecx+%2  ecx+2%2 %1+8%2  ecx+4%2
@@ -2676,17 +2676,17 @@ static av_always_inline void RENAME(do_a_deblock)(uint8_t *src, int step, int st
          "movq %%mm6, %0                         \n\t"
  
          : "=m" (eq_mask), "=m" (dc_mask)
-        : "r" (src), "r" ((long)step), "m" (c->pQPb), "m"(c->ppMode.flatnessThreshold)
+        : "r" (src), "r" ((x86_reg)step), "m" (c->pQPb), "m"(c->ppMode.flatnessThreshold)
          : "%"REG_a
      );
  
      both_masks = dc_mask & eq_mask;
  
      if(both_masks){
-        long offset= -8*step;
+        x86_reg offset= -8*step;
          int64_t *temp_sums= sums;
  
-        asm volatile(
+        __asm__ volatile(
              "movq %2, %%mm0                         \n\t"  // QP,..., QP
              "pxor %%mm4, %%mm4                      \n\t"
  
@@ -2820,12 +2820,12 @@ static av_always_inline void RENAME(do_a_deblock)(uint8_t *src, int step, int st
              "mov %4, %0                             \n\t" //FIXME
  
              : "+&r"(src)
-            : "r" ((long)step), "m" (c->pQPb), "r"(sums), "g"(src)
+            : "r" ((x86_reg)step), "m" (c->pQPb), "r"(sums), "g"(src)
          );
  
          src+= step; // src points to begin of the 8x8 Block
  
-        asm volatile(
+        __asm__ volatile(
              "movq %4, %%mm6                         \n\t"
              "pcmpeqb %%mm5, %%mm5                   \n\t"
              "pxor %%mm6, %%mm5                      \n\t"
@@ -2857,14 +2857,14 @@ static av_always_inline void RENAME(do_a_deblock)(uint8_t *src, int step, int st
              " js 1b                                 \n\t"
  
              : "+r"(offset), "+r"(temp_sums)
-            : "r" ((long)step), "r"(src - offset), "m"(both_masks)
+            : "r" ((x86_reg)step), "r"(src - offset), "m"(both_masks)
          );
      }else
          src+= step; // src points to begin of the 8x8 Block
  
      if(eq_mask != -1LL){
          uint8_t *temp_src= src;
-        asm volatile(
+        __asm__ volatile(
              "pxor %%mm7, %%mm7                      \n\t"
              "lea -40(%%"REG_SP"), %%"REG_c"         \n\t" // make space for 4 8-byte vars
              "and "ALIGN_MASK", %%"REG_c"            \n\t" // align
@@ -2970,7 +2970,7 @@ static av_always_inline void RENAME(do_a_deblock)(uint8_t *src, int step, int st
              "movq (%%"REG_c"), %%mm2                \n\t" // 2L0 - 5L1 + 5L2 - 2L3
              "movq 8(%%"REG_c"), %%mm3               \n\t" // 2H0 - 5H1 + 5H2 - 2H3
  
-#ifdef HAVE_MMX2
+#if HAVE_MMX2
              "movq %%mm7, %%mm6                      \n\t" // 0
              "psubw %%mm0, %%mm6                     \n\t"
              "pmaxsw %%mm6, %%mm0                    \n\t" // |2L4 - 5L5 + 5L6 - 2L7|
@@ -3002,7 +3002,7 @@ static av_always_inline void RENAME(do_a_deblock)(uint8_t *src, int step, int st
              "psubw %%mm6, %%mm3                     \n\t" // |2H0 - 5H1 + 5H2 - 2H3|
  #endif
  
-#ifdef HAVE_MMX2
+#if HAVE_MMX2
              "pminsw %%mm2, %%mm0                    \n\t"
              "pminsw %%mm3, %%mm1                    \n\t"
  #else
@@ -3066,7 +3066,7 @@ static av_always_inline void RENAME(do_a_deblock)(uint8_t *src, int step, int st
              "pand %%mm2, %%mm4                      \n\t"
              "pand %%mm3, %%mm5                      \n\t"
  
-#ifdef HAVE_MMX2
+#if HAVE_MMX2
              "pminsw %%mm0, %%mm4                    \n\t"
              "pminsw %%mm1, %%mm5                    \n\t"
  #else
@@ -3092,7 +3092,7 @@ static av_always_inline void RENAME(do_a_deblock)(uint8_t *src, int step, int st
              "movq %%mm0, (%0, %1)                   \n\t"
  
              : "+r" (temp_src)
-            : "r" ((long)step), "m" (c->pQPb), "m"(eq_mask)
+            : "r" ((x86_reg)step), "m" (c->pQPb), "m"(eq_mask)
              : "%"REG_a, "%"REG_c
          );
      }
@@ -3116,18 +3116,18 @@ static void RENAME(postProcess)(const uint8_t src[], int srcStride, uint8_t dst[
  static inline void RENAME(blockCopy)(uint8_t dst[], int dstStride, const uint8_t src[], int srcStride,
                                       int levelFix, int64_t *packedOffsetAndScale)
  {
-#ifndef HAVE_MMX
+#if !HAVE_MMX
      int i;
  #endif
      if(levelFix){
-#ifdef HAVE_MMX
-    asm volatile(
+#if HAVE_MMX
+    __asm__ volatile(
          "movq (%%"REG_a"), %%mm2        \n\t" // packedYOffset
          "movq 8(%%"REG_a"), %%mm3       \n\t" // packedYScale
          "lea (%2,%4), %%"REG_a"         \n\t"
          "lea (%3,%5), %%"REG_d"         \n\t"
          "pxor %%mm4, %%mm4              \n\t"
-#ifdef HAVE_MMX2
+#if HAVE_MMX2
  #define REAL_SCALED_CPY(src1, src2, dst1, dst2)                                                \
          "movq " #src1 ", %%mm0          \n\t"\
          "movq " #src1 ", %%mm5          \n\t"\
@@ -3193,8 +3193,8 @@ SCALED_CPY((%%REGa, %4), (%%REGa, %4, 2), (%%REGd, %5), (%%REGd, %5, 2))
          : "0" (packedOffsetAndScale),
          "r"(src),
          "r"(dst),
-        "r" ((long)srcStride),
-        "r" ((long)dstStride)
+        "r" ((x86_reg)srcStride),
+        "r" ((x86_reg)dstStride)
          : "%"REG_d
      );
  #else //HAVE_MMX
@@ -3203,8 +3203,8 @@ SCALED_CPY((%%REGa, %4), (%%REGa, %4, 2), (%%REGd, %5), (%%REGd, %5, 2))
                  &(src[srcStride*i]), BLOCK_SIZE);
  #endif //HAVE_MMX
      }else{
-#ifdef HAVE_MMX
-    asm volatile(
+#if HAVE_MMX
+    __asm__ volatile(
          "lea (%0,%2), %%"REG_a"                 \n\t"
          "lea (%1,%3), %%"REG_d"                 \n\t"
  
@@ -3226,8 +3226,8 @@ SIMPLE_CPY((%%REGa, %2), (%%REGa, %2, 2), (%%REGd, %3), (%%REGd, %3, 2))
  
          : : "r" (src),
          "r" (dst),
-        "r" ((long)srcStride),
-        "r" ((long)dstStride)
+        "r" ((x86_reg)srcStride),
+        "r" ((x86_reg)dstStride)
          : "%"REG_a, "%"REG_d
      );
  #else //HAVE_MMX
@@ -3243,15 +3243,15 @@ SIMPLE_CPY((%%REGa, %2), (%%REGa, %2, 2), (%%REGd, %3), (%%REGd, %3, 2))
   */
  static inline void RENAME(duplicate)(uint8_t src[], int stride)
  {
-#ifdef HAVE_MMX
-    asm volatile(
+#if HAVE_MMX
+    __asm__ volatile(
          "movq (%0), %%mm0               \n\t"
          "add %1, %0                     \n\t"
          "movq %%mm0, (%0)               \n\t"
          "movq %%mm0, (%0, %1)           \n\t"
          "movq %%mm0, (%0, %1, 2)        \n\t"
          : "+r" (src)
-        : "r" ((long)-stride)
+        : "r" ((x86_reg)-stride)
      );
  #else
      int i;
@@ -3280,7 +3280,7 @@ static void RENAME(postProcess)(const uint8_t src[], int srcStride, uint8_t dst[
      int QPCorrecture= 256*256;
  
      int copyAhead;
-#ifdef HAVE_MMX
+#if HAVE_MMX
      int i;
  #endif
  
@@ -3293,7 +3293,7 @@ static void RENAME(postProcess)(const uint8_t src[], int srcStride, uint8_t dst[
      uint8_t * const tempDst= dstStride > 0 ? c.tempDst : c.tempDst - 23*dstStride;
      //const int mbWidth= isColor ? (width+7)>>3 : (width+15)>>4;
  
-#ifdef HAVE_MMX
+#if HAVE_MMX
      for(i=0; i<57; i++){
          int offset= ((i*c.ppMode.baseDcDiff)>>8) + 1;
          int threshold= offset*2 + 1;
@@ -3351,7 +3351,7 @@ static void RENAME(postProcess)(const uint8_t src[], int srcStride, uint8_t dst[
  
          scale= (double)(c.ppMode.maxAllowedY - c.ppMode.minAllowedY) / (double)(white-black);
  
-#ifdef HAVE_MMX2
+#if HAVE_MMX2
          c.packedYScale= (uint16_t)(scale*256.0 + 0.5);
          c.packedYOffset= (((black*c.packedYScale)>>8) - c.ppMode.minAllowedY) & 0xFFFF;
  #else
@@ -3384,7 +3384,7 @@ static void RENAME(postProcess)(const uint8_t src[], int srcStride, uint8_t dst[
          // with the L1 Cache of the P4 ... or only a few blocks at a time or soemthing
          for(x=0; x<width; x+=BLOCK_SIZE){
  
-#ifdef HAVE_MMX2
+#if HAVE_MMX2
  /*
              prefetchnta(srcBlock + (((x>>2)&6) + 5)*srcStride + 32);
              prefetchnta(srcBlock + (((x>>2)&6) + 6)*srcStride + 32);
@@ -3392,7 +3392,7 @@ static void RENAME(postProcess)(const uint8_t src[], int srcStride, uint8_t dst[
              prefetcht0(dstBlock + (((x>>2)&6) + 6)*dstStride + 32);
  */
  
-            asm(
+            __asm__(
                  "mov %4, %%"REG_a"              \n\t"
                  "shr $2, %%"REG_a"              \n\t"
                  "and $6, %%"REG_a"              \n\t"
@@ -3406,12 +3406,12 @@ static void RENAME(postProcess)(const uint8_t src[], int srcStride, uint8_t dst[
                  "add %3, %%"REG_d"              \n\t"
                  "prefetchnta 32(%%"REG_a", %0)  \n\t"
                  "prefetcht0 32(%%"REG_d", %2)   \n\t"
-                :: "r" (srcBlock), "r" ((long)srcStride), "r" (dstBlock), "r" ((long)dstStride),
-                "g" ((long)x), "g" ((long)copyAhead)
+                :: "r" (srcBlock), "r" ((x86_reg)srcStride), "r" (dstBlock), "r" ((x86_reg)dstStride),
+                "g" ((x86_reg)x), "g" ((x86_reg)copyAhead)
                  : "%"REG_a, "%"REG_d
              );
  
-#elif defined(HAVE_3DNOW)
+#elif HAVE_AMD3DNOW
  //FIXME check if this is faster on an 3dnow chip or if it is faster without the prefetch or ...
  /*          prefetch(srcBlock + (((x>>3)&3) + 5)*srcStride + 32);
              prefetch(srcBlock + (((x>>3)&3) + 9)*srcStride + 32);
@@ -3457,7 +3457,7 @@ static void RENAME(postProcess)(const uint8_t src[], int srcStride, uint8_t dst[
          //1% speedup if these are here instead of the inner loop
          const uint8_t *srcBlock= &(src[y*srcStride]);
          uint8_t *dstBlock= &(dst[y*dstStride]);
-#ifdef HAVE_MMX
+#if HAVE_MMX
          uint8_t *tempBlock1= c.tempBlocks;
          uint8_t *tempBlock2= c.tempBlocks + 8;
  #endif
@@ -3493,7 +3493,7 @@ static void RENAME(postProcess)(const uint8_t src[], int srcStride, uint8_t dst[
          // with the L1 Cache of the P4 ... or only a few blocks at a time or soemthing
          for(x=0; x<width; x+=BLOCK_SIZE){
              const int stride= dstStride;
-#ifdef HAVE_MMX
+#if HAVE_MMX
              uint8_t *tmpXchg;
  #endif
              if(isColor){
@@ -3507,8 +3507,8 @@ static void RENAME(postProcess)(const uint8_t src[], int srcStride, uint8_t dst[
                  yHistogram[ srcBlock[srcStride*12 + 4] ]++;
              }
              c.QP= QP;
-#ifdef HAVE_MMX
-            asm volatile(
+#if HAVE_MMX
+            __asm__ volatile(
                  "movd %1, %%mm7         \n\t"
                  "packuswb %%mm7, %%mm7  \n\t" // 0, 0, 0, QP, 0, 0, 0, QP
                  "packuswb %%mm7, %%mm7  \n\t" // 0,QP, 0, QP, 0,QP, 0, QP
@@ -3520,7 +3520,7 @@ static void RENAME(postProcess)(const uint8_t src[], int srcStride, uint8_t dst[
  #endif
  
  
-#ifdef HAVE_MMX2
+#if HAVE_MMX2
  /*
              prefetchnta(srcBlock + (((x>>2)&6) + 5)*srcStride + 32);
              prefetchnta(srcBlock + (((x>>2)&6) + 6)*srcStride + 32);
@@ -3528,7 +3528,7 @@ static void RENAME(postProcess)(const uint8_t src[], int srcStride, uint8_t dst[
              prefetcht0(dstBlock + (((x>>2)&6) + 6)*dstStride + 32);
  */
  
-            asm(
+            __asm__(
                  "mov %4, %%"REG_a"              \n\t"
                  "shr $2, %%"REG_a"              \n\t"
                  "and $6, %%"REG_a"              \n\t"
@@ -3542,12 +3542,12 @@ static void RENAME(postProcess)(const uint8_t src[], int srcStride, uint8_t dst[
                  "add %3, %%"REG_d"              \n\t"
                  "prefetchnta 32(%%"REG_a", %0)  \n\t"
                  "prefetcht0 32(%%"REG_d", %2)   \n\t"
-                :: "r" (srcBlock), "r" ((long)srcStride), "r" (dstBlock), "r" ((long)dstStride),
-                "g" ((long)x), "g" ((long)copyAhead)
+                :: "r" (srcBlock), "r" ((x86_reg)srcStride), "r" (dstBlock), "r" ((x86_reg)dstStride),
+                "g" ((x86_reg)x), "g" ((x86_reg)copyAhead)
                  : "%"REG_a, "%"REG_d
              );
  
-#elif defined(HAVE_3DNOW)
+#elif HAVE_AMD3DNOW
  //FIXME check if this is faster on an 3dnow chip or if it is faster without the prefetch or ...
  /*          prefetch(srcBlock + (((x>>3)&3) + 5)*srcStride + 32);
              prefetch(srcBlock + (((x>>3)&3) + 9)*srcStride + 32);
@@ -3591,12 +3591,12 @@ static void RENAME(postProcess)(const uint8_t src[], int srcStride, uint8_t dst[
                  }
              }
  
-#ifdef HAVE_MMX
+#if HAVE_MMX
              RENAME(transpose1)(tempBlock1, tempBlock2, dstBlock, dstStride);
  #endif
              /* check if we have a previous block to deblock it with dstBlock */
              if(x - 8 >= 0){
-#ifdef HAVE_MMX
+#if HAVE_MMX
                  if(mode & H_X1_FILTER)
                          RENAME(vertX1Filter)(tempBlock1, 16, &c);
                  else if(mode & H_DEBLOCK){
@@ -3617,7 +3617,7 @@ static void RENAME(postProcess)(const uint8_t src[], int srcStride, uint8_t dst[
                  if(mode & H_X1_FILTER)
                      horizX1Filter(dstBlock-4, stride, QP);
                  else if(mode & H_DEBLOCK){
-#ifdef HAVE_ALTIVEC
+#if HAVE_ALTIVEC
                      DECLARE_ALIGNED(16, unsigned char, tempBlock[272]);
                      transpose_16x8_char_toPackedAlign_altivec(tempBlock, dstBlock - (4 + 1), stride);
  
@@ -3659,7 +3659,7 @@ static void RENAME(postProcess)(const uint8_t src[], int srcStride, uint8_t dst[
              dstBlock+=8;
              srcBlock+=8;
  
-#ifdef HAVE_MMX
+#if HAVE_MMX
              tmpXchg= tempBlock1;
              tempBlock1= tempBlock2;
              tempBlock2 = tmpXchg;
@@ -3699,10 +3699,10 @@ static void RENAME(postProcess)(const uint8_t src[], int srcStride, uint8_t dst[
                  + dstBlock[x +14*dstStride] + dstBlock[x +15*dstStride];
          }*/
      }
-#ifdef HAVE_3DNOW
-    asm volatile("femms");
-#elif defined (HAVE_MMX)
-    asm volatile("emms");
+#if   HAVE_AMD3DNOW
+    __asm__ volatile("femms");
+#elif HAVE_MMX
+    __asm__ volatile("emms");
  #endif
  
  #ifdef DEBUG_BRIGHTNESS