Skip to content
Snippets Groups Projects
  • Kyle Siefring's avatar
    Improve density of group context setting macros · 4385e7e1
    Kyle Siefring authored and Ronald S. Bultje's avatar Ronald S. Bultje committed
    Shared object binary size reduction:
    x84_64           : 16112 bytes
    ARM64            : 16008 bytes
    ARM64(+Os)       : 21592 bytes
    ARMv7(+Os+mthumb): 18480 bytes
    
    Size reduction of symbols:
    x84_64           : 15712 bytes
    ARM64            : 18688 bytes
    ARM64(+Os)       : 18404 bytes
    ARMv7(+Os+mthumb): 17322 bytes
    
    Compiles were done with clang version 18.1.8 and symbol sizes were
    obtained using nm on the shared object.
    
    Provides speed ups on older ARM64 cpus with very little impact on other
    cpus.
    
    Speedup:
    
    c7i (skylake)
     Nature1080p      : x0.999
     Chimera          : x0.998
    
    odroid C4
     Nature1080p      : x1.007
     Chimera          : x1.016
     Models1080p      : x1.005
     MountainBike1080p: x1.009
     Balloons1080p    : x1.008
    
    Raspberry Pi 4
     Nature1080p      : x1.005
     Chimera          : x0.999
     Models1080p      : x0.999
     MountainBike1080p: x1.004
     Balloons1080p    : x1.003
    
    Raspberry Pi 2 (Cortex-A7):
     (using size optimized build)
     Nature1080p      : x1.003
     Models1080p      : x0.997
    4385e7e1
intops.h 2.60 KiB
/*
 * Copyright © 2018, VideoLAN and dav1d authors
 * Copyright © 2018, Two Orioles, LLC
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 * 1. Redistributions of source code must retain the above copyright notice, this
 *    list of conditions and the following disclaimer.
 *
 * 2. Redistributions in binary form must reproduce the above copyright notice,
 *    this list of conditions and the following disclaimer in the documentation
 *    and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
 * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

#ifndef DAV1D_COMMON_INTOPS_H
#define DAV1D_COMMON_INTOPS_H

#include <stdint.h>

#include "common/attributes.h"

static inline int imax(const int a, const int b) {
    return a > b ? a : b;
}

static inline int imin(const int a, const int b) {
    return a < b ? a : b;
}

static inline unsigned umax(const unsigned a, const unsigned b) {
    return a > b ? a : b;
}

static inline unsigned umin(const unsigned a, const unsigned b) {
    return a < b ? a : b;
}

static inline int iclip(const int v, const int min, const int max) {
    return v < min ? min : v > max ? max : v;
}

static inline int iclip_u8(const int v) {
    return iclip(v, 0, 255);
}

static inline int apply_sign(const int v, const int s) {
    return s < 0 ? -v : v;
}

static inline int apply_sign64(const int v, const int64_t s) {
    return s < 0 ? -v : v;
}

static inline int ulog2(const unsigned v) {
    return 31 ^ clz(v);
}
static inline int u64log2(const uint64_t v) {
    return 63 ^ clzll(v);
}

static inline unsigned inv_recenter(const unsigned r, const unsigned v) {
    if (v > (r << 1))
        return v;
    else if ((v & 1) == 0)
        return (v >> 1) + r;
    else
        return r - ((v + 1) >> 1);
}

#endif /* DAV1D_COMMON_INTOPS_H */