Optimize 0 0 0-3 search, 45% faster on pentium dual.
authorMichael Niedermayer <michaelni@gmx.at>
Tue, 23 Dec 2008 00:38:45 +0000 (00:38 +0000)
committerMichael Niedermayer <michaelni@gmx.at>
Tue, 23 Dec 2008 00:38:45 +0000 (00:38 +0000)
Originally committed as revision 16284 to svn://svn.ffmpeg.org/ffmpeg/trunk

libavcodec/h264.c

index a170177fa4aef055b5b653769a94943d52d7037a..1e5ac60520a74ba1d6ea2fb0dc4f739ebe7ca1f5 100644 (file)
@@ -1375,9 +1375,26 @@ static const uint8_t *decode_nal(H264Context *h, const uint8_t *src, int *dst_le
     for(i=0; i<length; i++)
         printf("%2X ", src[i]);
 #endif
+
+#ifdef HAVE_FAST_UNALIGNED
+# ifdef HAVE_FAST_64BIT
+#   define RS 7
+    for(i=0; i+1<length; i+=9){
+        if(!((~*(uint64_t*)(src+i) & (*(uint64_t*)(src+i) - 0x0100010001000101ULL)) & 0x8000800080008080ULL))
+# else
+#   define RS 3
+    for(i=0; i+1<length; i+=5){
+        if(!((~*(uint32_t*)(src+i) & (*(uint32_t*)(src+i) - 0x01000101U)) & 0x80008080U))
+# endif
+            continue;
+        if(i>0 && !src[i]) i--;
+        while(src[i]) i++;
+#else
+#   define RS 0
     for(i=0; i+1<length; i+=2){
         if(src[i]) continue;
         if(i>0 && src[i-1]==0) i--;
+#endif
         if(i+2<length && src[i+1]==0 && src[i+2]<=3){
             if(src[i+2]!=3){
                 /* startcode, so we must be past the end */