+// DC quant of a whole 2x2 block
+#define QUANT_4_U_DC( idx0 ) \
+const vec_u16_t sel = (vec_u16_t) CV(-1,-1,-1,-1,0,0,0,0); \
+temp1v = vec_ld((idx0), *dct); \
+mskA = vec_cmplt(temp1v, zerov); \
+coefvA = (vec_u16_t) vec_max(vec_sub(zerov, temp1v), temp1v); \
+coefvA = vec_add(coefvA, biasv); \
+multEvenvA = vec_mule(coefvA, mfv); \
+multOddvA = vec_mulo(coefvA, mfv); \
+multEvenvA = vec_sr(multEvenvA, i_qbitsv); \
+multOddvA = vec_sr(multOddvA, i_qbitsv); \
+temp2v = (vec_s16_t) vec_packs(vec_mergeh(multEvenvA, multOddvA), vec_mergel(multEvenvA, multOddvA)); \
+temp2v = vec_xor(temp2v, mskA); \
+temp2v = vec_add(temp2v, vec_and(mskA, one)); \
+temp1v = vec_sel(temp1v, temp2v, sel); \
+vec_st(temp1v, (idx0), (int16_t*)dct);
+
+void x264_quant_2x2_dc_altivec( int16_t dct[2][2], int mf, int bias )
+{
+ vector bool short mskA;
+ vec_u32_t i_qbitsv;
+ vec_u16_t coefvA;
+ vec_u32_t multEvenvA, multOddvA;
+ vec_s16_t zerov, one;
+
+ vec_s16_t temp1v, temp2v;
+
+ vec_u16_t mfv;
+ vec_u16_t biasv;
+
+ vect_ushort_u mf_u;
+ mf_u.s[0]=mf;
+ mfv = vec_splat( mf_u.v, 0 );
+
+ vect_int_u qbits_u;
+ qbits_u.s[0]=16;
+ i_qbitsv = vec_splat(qbits_u.v, 0);
+
+ vect_ushort_u bias_u;
+ bias_u.s[0]=bias;
+ biasv = vec_splat(bias_u.v, 0);
+
+ zerov = vec_splat_s16(0);
+ one = vec_splat_s16(1);
+
+ QUANT_4_U_DC(0);
+}