ogg/openh264/libde265/thorのコードを最新化 (libvpxは #2 により更新見送り)

kazuki · Oct 31, 2015 · 609e653 · 609e653
1 parent 143096a
commit 609e653
Show file tree

Hide file tree

Showing 6 changed files with 21 additions and 60 deletions.
diff --git a/native/libde265 b/native/libde265
diff --git a/native/libde265_binding.cc b/native/libde265_binding.cc
@@ -5,16 +5,16 @@ extern "C" {
 
 void libde265_encoder_hack(encoder_context *ctx, int w, int h)
 {
-    ctx->sps.set_defaults();
-    ctx->sps.set_resolution(w, h);
-    ctx->sps.compute_derived_values();
+    //ctx->sps.set_defaults();
+    //ctx->sps.set_resolution(w, h);
+    //ctx->sps.compute_derived_values();
 }
 
 de265_image *libde265_image_allocate(encoder_context *ctx, int w, int h)
 {
     de265_image *img = new de265_image;
-    img->alloc_image(w, h, de265_chroma_420, &ctx->sps, false,
-                     NULL, ctx, 0, NULL, false);
+    //img->alloc_image(w, h, de265_chroma_420, &ctx->sps, false,
+    //NULL, ctx, 0, NULL, false);
     return img;
 }
 

diff --git a/native/ogg b/native/ogg
diff --git a/native/openh264 b/native/openh264
diff --git a/native/thor b/native/thor
diff --git a/native/thor.patch b/native/thor.patch
@@ -1,52 +1,13 @@
-commit 136fb23d432322978012e9b3198f50b9195ecc2e
-Author: Kazuki Oikawa <[email protected]>
-Date:   Mon Jul 27 20:35:12 2015 +0900
-
-    Fix compile error when use SIMD C emulation mode
-
-diff --git a/common/common_kernels.c b/common/common_kernels.c
-index 04f43be..b5e1307 100644
---- a/common/common_kernels.c
-+++ b/common/common_kernels.c
-@@ -194,13 +194,13 @@ static void get_inter_prediction_luma_inner(int width, int height, int xoff, int
-
-     for (int y = 0; y < height; y++) {
-       int res;
--      v128 ax = v128_unpacklo_u8_s16(v64_load_unaligned(ip - 2));
--      v128 a0 = v128_mullo_s16(c0, v128_unpacklo_u8_s16(v64_load_unaligned(ip - 2 * istride - 2)));
--      v128 a1 = v128_mullo_s16(c1, v128_unpacklo_u8_s16(v64_load_unaligned(ip - 1 * istride - 2)));
-+      v128 ax = v128_unpack_u8_s16(v64_load_unaligned(ip - 2));
-+      v128 a0 = v128_mullo_s16(c0, v128_unpack_u8_s16(v64_load_unaligned(ip - 2 * istride - 2)));
-+      v128 a1 = v128_mullo_s16(c1, v128_unpack_u8_s16(v64_load_unaligned(ip - 1 * istride - 2)));
-       v128 a2 = v128_mullo_s16(c2, ax);
--      v128 a3 = v128_mullo_s16(c3, v128_unpacklo_u8_s16(v64_load_unaligned(ip + 1 * istride - 2)));
--      v128 a4 = v128_mullo_s16(c4, v128_unpacklo_u8_s16(v64_load_unaligned(ip + 2 * istride - 2)));
--      v128 a5 = v128_mullo_s16(c5, v128_unpacklo_u8_s16(v64_load_unaligned(ip + 3 * istride - 2)));
-+      v128 a3 = v128_mullo_s16(c3, v128_unpack_u8_s16(v64_load_unaligned(ip + 1 * istride - 2)));
-+      v128 a4 = v128_mullo_s16(c4, v128_unpack_u8_s16(v64_load_unaligned(ip + 2 * istride - 2)));
-+      v128 a5 = v128_mullo_s16(c5, v128_unpack_u8_s16(v64_load_unaligned(ip + 3 * istride - 2)));
-
-       for (int x = 0; x < 3; x++) {
-         res = (v128_dotp_s16(c, v128_add_16(v128_add_16(v128_add_16(v128_add_16(v128_add_16(a0, a1), a2), a3), a4), a5)) + v128_dotp_s16(c, ax) * 128 + 8192) >> 14;
-@@ -315,7 +315,7 @@ static void get_inter_prediction_luma_centre(int width, int height,
-                                              const uint8_t *restrict ip, int istride)
- {
-   if (width == 4) {
--    v128 round = v128_dup_16(8);
-+    v64 round = v64_dup_16(8);
-     for (int i = 0; i < height; i++) {
-       v64 r, s;
-       r = v64_add_16(v64_unpacklo_u8_s16(v64_from_32(0, u32_load_unaligned(ip - 1 * istride + 0))),
-diff --git a/Makefile b/Makefile
-index 5ca91df..6291a4b 100644
---- a/Makefile
-+++ b/Makefile
+diff --git a/common/temporal_interp.c b/common/temporal_interp.c
+index c01747c..1209f38 100644
+--- a/common/temporal_interp.c
++++ b/common/temporal_interp.c
 @@ -1,7 +1,7 @@
- ENCODER_PROGRAM = build/Thorenc
- DECODER_PROGRAM = build/Thordec
-
--CFLAGS += -std=c99 -g -O6 -Wall -pedantic -I common
-+CFLAGS += -std=c99 -g -O2 -Wall -pedantic -I common
- LDFLAGS = -lm
-
- ifeq ($(ARCH),neon)
+ #include <math.h>
+ #include <assert.h>
+ #include <string.h>
+-#include "emmintrin.h"
++//#include "emmintrin.h"
+ #include "simd.h"
+ #include "global.h"
+ #include "temporal_interp.h"