• François Cartegnie's avatar
    x86: add SSSE3 mc prep_8tap implementation · 0afec6b1
    François Cartegnie authored
    ---------------------
    x86_64:
    ------------------------------------------
    mct_8tap_regular_w4_0_8bpc_c: 115.6
    mct_8tap_regular_w4_0_8bpc_ssse3: 13.1
    mct_8tap_regular_w4_0_8bpc_avx2: 13.3
    ------------------------------------------
    mct_8tap_regular_w4_h_8bpc_c: 363.0
    mct_8tap_regular_w4_h_8bpc_ssse3: 19.1
    mct_8tap_regular_w4_h_8bpc_avx2: 16.5
    ------------------------------------------
    mct_8tap_regular_w4_hv_8bpc_c: 832.2
    mct_8tap_regular_w4_hv_8bpc_ssse3: 113.4
    mct_8tap_regular_w4_hv_8bpc_avx2: 53.1
    ------------------------------------------
    mct_8tap_regular_w4_v_8bpc_c: 488.5
    mct_8tap_regular_w4_v_8bpc_ssse3: 38.9
    mct_8tap_regular_w4_v_8bpc_avx2: 26.0
    ------------------------------------------
    mct_8tap_regular_w8_0_8bpc_c: 259.3
    mct_8tap_regular_w8_0_8bpc_ssse3: 20.4
    mct_8tap_regular_w8_0_8bpc_avx2: 18.0
    ------------------------------------------
    mct_8tap_regular_w8_h_8bpc_c: 1124.3
    mct_8tap_regular_w8_h_8bpc_ssse3: 67.7
    mct_8tap_regular_w8_h_8bpc_avx2: 43.3
    ------------------------------------------
    mct_8tap_regular_w8_hv_8bpc_c: 2155.0
    mct_8tap_regular_w8_hv_8bpc_ssse3: 340.8
    mct_8tap_regular_w8_hv_8bpc_avx2: 151.3
    ------------------------------------------
    mct_8tap_regular_w8_v_8bpc_c: 1195.4
    mct_8tap_regular_w8_v_8bpc_ssse3: 72.4
    mct_8tap_regular_w8_v_8bpc_avx2: 39.8
    ------------------------------------------
    mct_8tap_regular_w16_0_8bpc_c: 158.3
    mct_8tap_regular_w16_0_8bpc_ssse3: 52.9
    mct_8tap_regular_w16_0_8bpc_avx2: 30.2
    ------------------------------------------
    mct_8tap_regular_w16_h_8bpc_c: 4267.4
    mct_8tap_regular_w16_h_8bpc_ssse3: 211.9
    mct_8tap_regular_w16_h_8bpc_avx2: 121.4
    ------------------------------------------
    mct_8tap_regular_w16_hv_8bpc_c: 5430.9
    mct_8tap_regular_w16_hv_8bpc_ssse3: 986.8
    mct_8tap_regular_w16_hv_8bpc_avx2: 428.4
    ------------------------------------------
    mct_8tap_regular_w16_v_8bpc_c: 4604.2
    mct_8tap_regular_w16_v_8bpc_ssse3: 199.1
    mct_8tap_regular_w16_v_8bpc_avx2: 100.7
    ------------------------------------------
    mct_8tap_regular_w32_0_8bpc_c: 372.9
    mct_8tap_regular_w32_0_8bpc_ssse3: 231.9
    mct_8tap_regular_w32_0_8bpc_avx2: 99.7
    ------------------------------------------
    mct_8tap_regular_w32_h_8bpc_c: 15975.0
    mct_8tap_regular_w32_h_8bpc_ssse3: 802.9
    mct_8tap_regular_w32_h_8bpc_avx2: 468.5
    ------------------------------------------
    mct_8tap_regular_w32_hv_8bpc_c: 18555.5
    mct_8tap_regular_w32_hv_8bpc_ssse3: 3673.5
    mct_8tap_regular_w32_hv_8bpc_avx2: 1587.6
    ------------------------------------------
    mct_8tap_regular_w32_v_8bpc_c: 16632.4
    mct_8tap_regular_w32_v_8bpc_ssse3: 743.5
    mct_8tap_regular_w32_v_8bpc_avx2: 337.8
    ------------------------------------------
    mct_8tap_regular_w64_0_8bpc_c: 675.9
    mct_8tap_regular_w64_0_8bpc_ssse3: 513.6
    mct_8tap_regular_w64_0_8bpc_avx2: 285.4
    ------------------------------------------
    mct_8tap_regular_w64_h_8bpc_c: 37161.3
    mct_8tap_regular_w64_h_8bpc_ssse3: 1929.7
    mct_8tap_regular_w64_h_8bpc_avx2: 1138.1
    ------------------------------------------
    mct_8tap_regular_w64_hv_8bpc_c: 42434.0
    mct_8tap_regular_w64_hv_8bpc_ssse3: 8822.1
    mct_8tap_regular_w64_hv_8bpc_avx2: 3853.5
    ------------------------------------------
    mct_8tap_regular_w64_v_8bpc_c: 37969.1
    mct_8tap_regular_w64_v_8bpc_ssse3: 1805.6
    mct_8tap_regular_w64_v_8bpc_avx2: 826.1
    ------------------------------------------
    mct_8tap_regular_w128_0_8bpc_c: 1532.7
    mct_8tap_regular_w128_0_8bpc_ssse3: 1397.7
    mct_8tap_regular_w128_0_8bpc_avx2: 813.8
    ------------------------------------------
    mct_8tap_regular_w128_h_8bpc_c: 91204.3
    mct_8tap_regular_w128_h_8bpc_ssse3: 4783.0
    mct_8tap_regular_w128_h_8bpc_avx2: 2767.2
    ------------------------------------------
    mct_8tap_regular_w128_hv_8bpc_c: 102396.0
    mct_8tap_regular_w128_hv_8bpc_ssse3: 22202.3
    mct_8tap_regular_w128_hv_8bpc_avx2: 9637.2
    ------------------------------------------
    mct_8tap_regular_w128_v_8bpc_c: 92294.3
    mct_8tap_regular_w128_v_8bpc_ssse3: 4952.8
    mct_8tap_regular_w128_v_8bpc_avx2: 2370.1
    ------------------------------------------
    
    ---------------------
    x86_32:
    ------------------------------------------
    mct_8tap_regular_w4_0_8bpc_c: 131.3
    mct_8tap_regular_w4_0_8bpc_ssse3: 18.7
    ------------------------------------------
    mct_8tap_regular_w4_h_8bpc_c: 422.0
    mct_8tap_regular_w4_h_8bpc_ssse3: 27.3
    ------------------------------------------
    mct_8tap_regular_w4_hv_8bpc_c: 1012.6
    mct_8tap_regular_w4_hv_8bpc_ssse3: 123.6
    ------------------------------------------
    mct_8tap_regular_w4_v_8bpc_c: 589.6
    mct_8tap_regular_w4_v_8bpc_ssse3: 48.9
    ------------------------------------------
    mct_8tap_regular_w8_0_8bpc_c: 278.5
    mct_8tap_regular_w8_0_8bpc_ssse3: 26.3
    ------------------------------------------
    mct_8tap_regular_w8_h_8bpc_c: 1129.3
    mct_8tap_regular_w8_h_8bpc_ssse3: 80.6
    ------------------------------------------
    mct_8tap_regular_w8_hv_8bpc_c: 2556.4
    mct_8tap_regular_w8_hv_8bpc_ssse3: 354.6
    ------------------------------------------
    mct_8tap_regular_w8_v_8bpc_c: 1460.2
    mct_8tap_regular_w8_v_8bpc_ssse3: 103.8
    ------------------------------------------
    mct_8tap_regular_w16_0_8bpc_c: 218.9
    mct_8tap_regular_w16_0_8bpc_ssse3: 58.4
    ------------------------------------------
    mct_8tap_regular_w16_h_8bpc_c: 4471.8
    mct_8tap_regular_w16_h_8bpc_ssse3: 237.2
    ------------------------------------------
    mct_8tap_regular_w16_hv_8bpc_c: 5570.5
    mct_8tap_regular_w16_hv_8bpc_ssse3: 1044.1
    ------------------------------------------
    mct_8tap_regular_w16_v_8bpc_c: 4885.5
    mct_8tap_regular_w16_v_8bpc_ssse3: 268.3
    ------------------------------------------
    mct_8tap_regular_w32_0_8bpc_c: 495.6
    mct_8tap_regular_w32_0_8bpc_ssse3: 236.6
    ------------------------------------------
    mct_8tap_regular_w32_h_8bpc_c: 15903.5
    mct_8tap_regular_w32_h_8bpc_ssse3: 872.5
    ------------------------------------------
    mct_8tap_regular_w32_hv_8bpc_c: 19402.2
    mct_8tap_regular_w32_hv_8bpc_ssse3: 3832.8
    ------------------------------------------
    mct_8tap_regular_w32_v_8bpc_c: 17119.5
    mct_8tap_regular_w32_v_8bpc_ssse3: 935.2
    ------------------------------------------
    mct_8tap_regular_w64_0_8bpc_c: 877.0
    mct_8tap_regular_w64_0_8bpc_ssse3: 515.7
    ------------------------------------------
    mct_8tap_regular_w64_h_8bpc_c: 36832.1
    mct_8tap_regular_w64_h_8bpc_ssse3: 2094.1
    ------------------------------------------
    mct_8tap_regular_w64_hv_8bpc_c: 43965.3
    mct_8tap_regular_w64_hv_8bpc_ssse3: 9423.0
    ------------------------------------------
    mct_8tap_regular_w64_v_8bpc_c: 37041.2
    mct_8tap_regular_w64_v_8bpc_ssse3: 2348.9
    ------------------------------------------
    mct_8tap_regular_w128_0_8bpc_c: 1929.9
    mct_8tap_regular_w128_0_8bpc_ssse3: 1392.3
    ------------------------------------------
    mct_8tap_regular_w128_h_8bpc_c: 86022.5
    mct_8tap_regular_w128_h_8bpc_ssse3: 5110.8
    ------------------------------------------
    mct_8tap_regular_w128_hv_8bpc_c: 105793.5
    mct_8tap_regular_w128_hv_8bpc_ssse3: 23278.8
    ------------------------------------------
    mct_8tap_regular_w128_v_8bpc_c: 88223.5
    mct_8tap_regular_w128_v_8bpc_ssse3: 7442.7
    ------------------------------------------
    0afec6b1
Name
Last commit
Last update
..
arm Loading commit data...
ext/x86 Loading commit data...
win32 Loading commit data...
x86 Loading commit data...
cdef.h Loading commit data...
cdef_apply.h Loading commit data...
cdef_apply_tmpl.c Loading commit data...
cdef_tmpl.c Loading commit data...
cdf.c Loading commit data...
cdf.h Loading commit data...
cpu.c Loading commit data...
cpu.h Loading commit data...
ctx.h Loading commit data...
data.c Loading commit data...
data.h Loading commit data...
dav1d.rc.in Loading commit data...
decode.c Loading commit data...
decode.h Loading commit data...
dequant_tables.c Loading commit data...
dequant_tables.h Loading commit data...
env.h Loading commit data...
film_grain.h Loading commit data...
film_grain_tmpl.c Loading commit data...
getbits.c Loading commit data...
getbits.h Loading commit data...
internal.h Loading commit data...
intra_edge.c Loading commit data...
intra_edge.h Loading commit data...
ipred.h Loading commit data...
ipred_prepare.h Loading commit data...
ipred_prepare_tmpl.c Loading commit data...
ipred_tmpl.c Loading commit data...
itx.h Loading commit data...
itx_1d.c Loading commit data...
itx_tmpl.c Loading commit data...
levels.h Loading commit data...
lf_apply.h Loading commit data...
lf_apply_tmpl.c Loading commit data...
lf_mask.c Loading commit data...
lf_mask.h Loading commit data...
lib.c Loading commit data...
log.c Loading commit data...
log.h Loading commit data...
loopfilter.h Loading commit data...
loopfilter_tmpl.c Loading commit data...
looprestoration.h Loading commit data...
looprestoration_tmpl.c Loading commit data...
lr_apply.h Loading commit data...
lr_apply_tmpl.c Loading commit data...
mc.h Loading commit data...
mc_tmpl.c Loading commit data...
meson.build Loading commit data...
msac.c Loading commit data...
msac.h Loading commit data...
obu.c Loading commit data...
obu.h Loading commit data...
picture.c Loading commit data...
picture.h Loading commit data...
qm.c Loading commit data...
qm.h Loading commit data...
recon.h Loading commit data...
recon_tmpl.c Loading commit data...
ref.c Loading commit data...
ref.h Loading commit data...
ref_mvs.c Loading commit data...
ref_mvs.h Loading commit data...
scan.c Loading commit data...
scan.h Loading commit data...
tables.c Loading commit data...
tables.h Loading commit data...
thread.h Loading commit data...
thread_data.h Loading commit data...
thread_task.c Loading commit data...
thread_task.h Loading commit data...
warpmv.c Loading commit data...
warpmv.h Loading commit data...
wedge.c Loading commit data...
wedge.h Loading commit data...