mirror of
				https://github.com/GrapheneOS/hardened_malloc.git
				synced 2025-11-04 09:46:32 +01:00 
			
		
		
		
	Compare commits
	
		
			11 commits
		
	
	
		
			885a0490d0
			...
			de4df3d119
		
	
	| Author | SHA1 | Date | |
|---|---|---|---|
| 
							 | 
						de4df3d119 | ||
| 
							 | 
						ffcfeee69f | ||
| 
							 | 
						ff99511eb4 | ||
| 
							 | 
						c392d40843 | ||
| 
							 | 
						7481c8857f | ||
| 
							 | 
						1d7fc7ffe0 | ||
| 
							 | 
						4fe9018b6f | ||
| 
							 | 
						3ab23f7ebf | ||
| 
							 | 
						c894f3ec1d | ||
| 
							 | 
						c97263ef0c | ||
| 
							 | 
						a7302add63 | 
					 9 changed files with 79 additions and 39 deletions
				
			
		
							
								
								
									
										14
									
								
								.github/workflows/build-and-test.yml
									
										
									
									
										vendored
									
									
								
							
							
						
						
									
										14
									
								
								.github/workflows/build-and-test.yml
									
										
									
									
										vendored
									
									
								
							| 
						 | 
					@ -11,9 +11,9 @@ jobs:
 | 
				
			||||||
    runs-on: ubuntu-latest
 | 
					    runs-on: ubuntu-latest
 | 
				
			||||||
    strategy:
 | 
					    strategy:
 | 
				
			||||||
      matrix:
 | 
					      matrix:
 | 
				
			||||||
        version: [12]
 | 
					        version: [12, 13, 14]
 | 
				
			||||||
    steps:
 | 
					    steps:
 | 
				
			||||||
      - uses: actions/checkout@v4
 | 
					      - uses: actions/checkout@v5
 | 
				
			||||||
      - name: Setting up gcc version
 | 
					      - name: Setting up gcc version
 | 
				
			||||||
        run: |
 | 
					        run: |
 | 
				
			||||||
          sudo update-alternatives --install /usr/bin/g++ g++ /usr/bin/g++-${{ matrix.version }} 100
 | 
					          sudo update-alternatives --install /usr/bin/g++ g++ /usr/bin/g++-${{ matrix.version }} 100
 | 
				
			||||||
| 
						 | 
					@ -24,9 +24,11 @@ jobs:
 | 
				
			||||||
    runs-on: ubuntu-latest
 | 
					    runs-on: ubuntu-latest
 | 
				
			||||||
    strategy:
 | 
					    strategy:
 | 
				
			||||||
      matrix:
 | 
					      matrix:
 | 
				
			||||||
        version: [14, 15]
 | 
					        version: [14, 15, 16, 17, 18]
 | 
				
			||||||
    steps:
 | 
					    steps:
 | 
				
			||||||
      - uses: actions/checkout@v4
 | 
					      - uses: actions/checkout@v5
 | 
				
			||||||
 | 
					      - name: Install dependencies
 | 
				
			||||||
 | 
					        run: sudo apt-get update && sudo apt-get install -y --no-install-recommends clang-14 clang-15
 | 
				
			||||||
      - name: Setting up clang version
 | 
					      - name: Setting up clang version
 | 
				
			||||||
        run: |
 | 
					        run: |
 | 
				
			||||||
          sudo update-alternatives --install /usr/bin/clang++ clang++ /usr/bin/clang++-${{ matrix.version }} 100
 | 
					          sudo update-alternatives --install /usr/bin/clang++ clang++ /usr/bin/clang++-${{ matrix.version }} 100
 | 
				
			||||||
| 
						 | 
					@ -38,7 +40,7 @@ jobs:
 | 
				
			||||||
    container:
 | 
					    container:
 | 
				
			||||||
      image: alpine:latest
 | 
					      image: alpine:latest
 | 
				
			||||||
    steps:
 | 
					    steps:
 | 
				
			||||||
      - uses: actions/checkout@v4
 | 
					      - uses: actions/checkout@v5
 | 
				
			||||||
      - name: Install dependencies
 | 
					      - name: Install dependencies
 | 
				
			||||||
        run: apk update && apk add build-base python3
 | 
					        run: apk update && apk add build-base python3
 | 
				
			||||||
      - name: Build
 | 
					      - name: Build
 | 
				
			||||||
| 
						 | 
					@ -46,7 +48,7 @@ jobs:
 | 
				
			||||||
  build-ubuntu-gcc-aarch64:
 | 
					  build-ubuntu-gcc-aarch64:
 | 
				
			||||||
    runs-on: ubuntu-latest
 | 
					    runs-on: ubuntu-latest
 | 
				
			||||||
    steps:
 | 
					    steps:
 | 
				
			||||||
      - uses: actions/checkout@v4
 | 
					      - uses: actions/checkout@v5
 | 
				
			||||||
      - name: Install dependencies
 | 
					      - name: Install dependencies
 | 
				
			||||||
        run: sudo apt-get update && sudo apt-get install -y --no-install-recommends gcc-aarch64-linux-gnu g++-aarch64-linux-gnu libgcc-s1-arm64-cross cpp-aarch64-linux-gnu
 | 
					        run: sudo apt-get update && sudo apt-get install -y --no-install-recommends gcc-aarch64-linux-gnu g++-aarch64-linux-gnu libgcc-s1-arm64-cross cpp-aarch64-linux-gnu
 | 
				
			||||||
      - name: Build
 | 
					      - name: Build
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
							
								
								
									
										2
									
								
								LICENSE
									
										
									
									
									
								
							
							
						
						
									
										2
									
								
								LICENSE
									
										
									
									
									
								
							| 
						 | 
					@ -1,4 +1,4 @@
 | 
				
			||||||
Copyright © 2018-2024 GrapheneOS
 | 
					Copyright © 2018-2025 GrapheneOS
 | 
				
			||||||
 | 
					
 | 
				
			||||||
Permission is hereby granted, free of charge, to any person obtaining a copy
 | 
					Permission is hereby granted, free of charge, to any person obtaining a copy
 | 
				
			||||||
of this software and associated documentation files (the "Software"), to deal
 | 
					of this software and associated documentation files (the "Software"), to deal
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
							
								
								
									
										14
									
								
								README.md
									
										
									
									
									
								
							
							
						
						
									
										14
									
								
								README.md
									
										
									
									
									
								
							| 
						 | 
					@ -65,14 +65,14 @@ used instead as this allocator fundamentally doesn't support that environment.
 | 
				
			||||||
 | 
					
 | 
				
			||||||
## Dependencies
 | 
					## Dependencies
 | 
				
			||||||
 | 
					
 | 
				
			||||||
Debian stable (currently Debian 12) determines the most ancient set of
 | 
					Debian stable (currently Debian 13) determines the most ancient set of
 | 
				
			||||||
supported dependencies:
 | 
					supported dependencies:
 | 
				
			||||||
 | 
					
 | 
				
			||||||
* glibc 2.36
 | 
					* glibc 2.41
 | 
				
			||||||
* Linux 6.1
 | 
					* Linux 6.12
 | 
				
			||||||
* Clang 14.0.6 or GCC 12.2.0
 | 
					* Clang 19.1.7 or GCC 14.2.0
 | 
				
			||||||
 | 
					
 | 
				
			||||||
For Android, the Linux GKI 5.10, 5.15 and 6.1 branches are supported.
 | 
					For Android, the Linux GKI 6.1, 6.6 and 6.12 branches are supported.
 | 
				
			||||||
 | 
					
 | 
				
			||||||
However, using more recent releases is highly recommended. Older versions of
 | 
					However, using more recent releases is highly recommended. Older versions of
 | 
				
			||||||
the dependencies may be compatible at the moment but are not tested and will
 | 
					the dependencies may be compatible at the moment but are not tested and will
 | 
				
			||||||
| 
						 | 
					@ -83,7 +83,7 @@ there will be custom integration offering better performance in the future
 | 
				
			||||||
along with other hardening for the C standard library implementation.
 | 
					along with other hardening for the C standard library implementation.
 | 
				
			||||||
 | 
					
 | 
				
			||||||
For Android, only the current generation, actively developed maintenance branch of the Android
 | 
					For Android, only the current generation, actively developed maintenance branch of the Android
 | 
				
			||||||
Open Source Project will be supported, which currently means `android13-qpr2-release`.
 | 
					Open Source Project will be supported, which currently means `android16-release`.
 | 
				
			||||||
 | 
					
 | 
				
			||||||
## Testing
 | 
					## Testing
 | 
				
			||||||
 | 
					
 | 
				
			||||||
| 
						 | 
					@ -160,7 +160,7 @@ The format of this configuration file is a whitespace-separated list, so it's
 | 
				
			||||||
good practice to put each library on a separate line.
 | 
					good practice to put each library on a separate line.
 | 
				
			||||||
 | 
					
 | 
				
			||||||
For maximum compatibility `libhardened_malloc.so` can be installed into
 | 
					For maximum compatibility `libhardened_malloc.so` can be installed into
 | 
				
			||||||
`/usr/lib/` to avoid preload failures caused by AppArmor profile or systemd
 | 
					`/usr/lib/` to avoid preload failures caused by AppArmor profiles or systemd
 | 
				
			||||||
ExecPaths= restrictions. Check for logs of the following format:
 | 
					ExecPaths= restrictions. Check for logs of the following format:
 | 
				
			||||||
 | 
					
 | 
				
			||||||
    ERROR: ld.so: object '/usr/local/lib/libhardened_malloc.so' from /etc/ld.so.preload cannot be preloaded (failed to map segment from shared object): ignored.
 | 
					    ERROR: ld.so: object '/usr/local/lib/libhardened_malloc.so' from /etc/ld.so.preload cannot be preloaded (failed to map segment from shared object): ignored.
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
| 
						 | 
					@ -44,7 +44,7 @@ void *set_pointer_tag(void *ptr, u8 tag) {
 | 
				
			||||||
    return (void *) (((uintptr_t) tag << 56) | (uintptr_t) untag_pointer(ptr));
 | 
					    return (void *) (((uintptr_t) tag << 56) | (uintptr_t) untag_pointer(ptr));
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
// This test checks that slab slot allocation uses tag that is distint from tags of its neighbors
 | 
					// This test checks that slab slot allocation uses tag that is distinct from tags of its neighbors
 | 
				
			||||||
// and from the tag of the previous allocation that used the same slot
 | 
					// and from the tag of the previous allocation that used the same slot
 | 
				
			||||||
void tag_distinctness() {
 | 
					void tag_distinctness() {
 | 
				
			||||||
    // tag 0 is reserved
 | 
					    // tag 0 is reserved
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
							
								
								
									
										2
									
								
								chacha.c
									
										
									
									
									
								
							
							
						
						
									
										2
									
								
								chacha.c
									
										
									
									
									
								
							| 
						 | 
					@ -41,7 +41,7 @@ static const unsigned rounds = 8;
 | 
				
			||||||
    a = PLUS(a, b); d = ROTATE(XOR(d, a), 8); \
 | 
					    a = PLUS(a, b); d = ROTATE(XOR(d, a), 8); \
 | 
				
			||||||
    c = PLUS(c, d); b = ROTATE(XOR(b, c), 7);
 | 
					    c = PLUS(c, d); b = ROTATE(XOR(b, c), 7);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
static const char sigma[16] = "expand 32-byte k";
 | 
					static const char sigma[16] NONSTRING = "expand 32-byte k";
 | 
				
			||||||
 | 
					
 | 
				
			||||||
void chacha_keysetup(chacha_ctx *x, const u8 *k) {
 | 
					void chacha_keysetup(chacha_ctx *x, const u8 *k) {
 | 
				
			||||||
    x->input[0] = U8TO32_LITTLE(sigma + 0);
 | 
					    x->input[0] = U8TO32_LITTLE(sigma + 0);
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
| 
						 | 
					@ -98,7 +98,7 @@ class TestSimpleMemoryCorruption(unittest.TestCase):
 | 
				
			||||||
        self.assertEqual(stderr.decode("utf-8"),
 | 
					        self.assertEqual(stderr.decode("utf-8"),
 | 
				
			||||||
                         "fatal allocator error: invalid free\n")
 | 
					                         "fatal allocator error: invalid free\n")
 | 
				
			||||||
 | 
					
 | 
				
			||||||
    def test_invalid_malloc_usable_size_small_quarantene(self):
 | 
					    def test_invalid_malloc_usable_size_small_quarantine(self):
 | 
				
			||||||
        _stdout, stderr, returncode = self.run_test(
 | 
					        _stdout, stderr, returncode = self.run_test(
 | 
				
			||||||
            "invalid_malloc_usable_size_small_quarantine")
 | 
					            "invalid_malloc_usable_size_small_quarantine")
 | 
				
			||||||
        self.assertEqual(returncode, -6)
 | 
					        self.assertEqual(returncode, -6)
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
							
								
								
									
										75
									
								
								third_party/libdivide.h
									
										
									
									
										vendored
									
									
								
							
							
						
						
									
										75
									
								
								third_party/libdivide.h
									
										
									
									
										vendored
									
									
								
							| 
						 | 
					@ -11,9 +11,11 @@
 | 
				
			||||||
#ifndef LIBDIVIDE_H
 | 
					#ifndef LIBDIVIDE_H
 | 
				
			||||||
#define LIBDIVIDE_H
 | 
					#define LIBDIVIDE_H
 | 
				
			||||||
 | 
					
 | 
				
			||||||
#define LIBDIVIDE_VERSION "5.1"
 | 
					// *** Version numbers are auto generated - do not edit ***
 | 
				
			||||||
 | 
					#define LIBDIVIDE_VERSION "5.2.0"
 | 
				
			||||||
#define LIBDIVIDE_VERSION_MAJOR 5
 | 
					#define LIBDIVIDE_VERSION_MAJOR 5
 | 
				
			||||||
#define LIBDIVIDE_VERSION_MINOR 1
 | 
					#define LIBDIVIDE_VERSION_MINOR 2
 | 
				
			||||||
 | 
					#define LIBDIVIDE_VERSION_PATCH 0
 | 
				
			||||||
 | 
					
 | 
				
			||||||
#include <stdint.h>
 | 
					#include <stdint.h>
 | 
				
			||||||
 | 
					
 | 
				
			||||||
| 
						 | 
					@ -34,8 +36,15 @@
 | 
				
			||||||
#include <arm_neon.h>
 | 
					#include <arm_neon.h>
 | 
				
			||||||
#endif
 | 
					#endif
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					// Clang-cl prior to Visual Studio 2022 doesn't include __umulh/__mulh intrinsics
 | 
				
			||||||
 | 
					#if defined(_MSC_VER) && defined(LIBDIVIDE_X86_64) && (!defined(__clang__) || _MSC_VER>1930)
 | 
				
			||||||
 | 
					#define LIBDIVIDE_X64_INTRINSICS
 | 
				
			||||||
 | 
					#endif
 | 
				
			||||||
 | 
					
 | 
				
			||||||
#if defined(_MSC_VER)
 | 
					#if defined(_MSC_VER)
 | 
				
			||||||
 | 
					#if defined(LIBDIVIDE_X64_INTRINSICS)
 | 
				
			||||||
#include <intrin.h>
 | 
					#include <intrin.h>
 | 
				
			||||||
 | 
					#endif
 | 
				
			||||||
#pragma warning(push)
 | 
					#pragma warning(push)
 | 
				
			||||||
// disable warning C4146: unary minus operator applied
 | 
					// disable warning C4146: unary minus operator applied
 | 
				
			||||||
// to unsigned type, result still unsigned
 | 
					// to unsigned type, result still unsigned
 | 
				
			||||||
| 
						 | 
					@ -238,18 +247,28 @@ static LIBDIVIDE_INLINE struct libdivide_u32_branchfree_t libdivide_u32_branchfr
 | 
				
			||||||
static LIBDIVIDE_INLINE struct libdivide_s64_branchfree_t libdivide_s64_branchfree_gen(int64_t d);
 | 
					static LIBDIVIDE_INLINE struct libdivide_s64_branchfree_t libdivide_s64_branchfree_gen(int64_t d);
 | 
				
			||||||
static LIBDIVIDE_INLINE struct libdivide_u64_branchfree_t libdivide_u64_branchfree_gen(uint64_t d);
 | 
					static LIBDIVIDE_INLINE struct libdivide_u64_branchfree_t libdivide_u64_branchfree_gen(uint64_t d);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
static LIBDIVIDE_INLINE int16_t libdivide_s16_do_raw(int16_t numer, int16_t magic, uint8_t more);
 | 
					static LIBDIVIDE_INLINE int16_t libdivide_s16_do_raw(
 | 
				
			||||||
 | 
					    int16_t numer, int16_t magic, uint8_t more);
 | 
				
			||||||
static LIBDIVIDE_INLINE int16_t libdivide_s16_do(
 | 
					static LIBDIVIDE_INLINE int16_t libdivide_s16_do(
 | 
				
			||||||
    int16_t numer, const struct libdivide_s16_t *denom);
 | 
					    int16_t numer, const struct libdivide_s16_t *denom);
 | 
				
			||||||
static LIBDIVIDE_INLINE uint16_t libdivide_u16_do_raw(uint16_t numer, uint16_t magic, uint8_t more);
 | 
					static LIBDIVIDE_INLINE uint16_t libdivide_u16_do_raw(
 | 
				
			||||||
 | 
					    uint16_t numer, uint16_t magic, uint8_t more);
 | 
				
			||||||
static LIBDIVIDE_INLINE uint16_t libdivide_u16_do(
 | 
					static LIBDIVIDE_INLINE uint16_t libdivide_u16_do(
 | 
				
			||||||
    uint16_t numer, const struct libdivide_u16_t *denom);
 | 
					    uint16_t numer, const struct libdivide_u16_t *denom);
 | 
				
			||||||
 | 
					static LIBDIVIDE_INLINE int32_t libdivide_s32_do_raw(
 | 
				
			||||||
 | 
					    int32_t numer, int32_t magic, uint8_t more);
 | 
				
			||||||
static LIBDIVIDE_INLINE int32_t libdivide_s32_do(
 | 
					static LIBDIVIDE_INLINE int32_t libdivide_s32_do(
 | 
				
			||||||
    int32_t numer, const struct libdivide_s32_t *denom);
 | 
					    int32_t numer, const struct libdivide_s32_t *denom);
 | 
				
			||||||
 | 
					static LIBDIVIDE_INLINE uint32_t libdivide_u32_do_raw(
 | 
				
			||||||
 | 
					    uint32_t numer, uint32_t magic, uint8_t more);
 | 
				
			||||||
static LIBDIVIDE_INLINE uint32_t libdivide_u32_do(
 | 
					static LIBDIVIDE_INLINE uint32_t libdivide_u32_do(
 | 
				
			||||||
    uint32_t numer, const struct libdivide_u32_t *denom);
 | 
					    uint32_t numer, const struct libdivide_u32_t *denom);
 | 
				
			||||||
 | 
					static LIBDIVIDE_INLINE int64_t libdivide_s64_do_raw(
 | 
				
			||||||
 | 
					    int64_t numer, int64_t magic, uint8_t more);
 | 
				
			||||||
static LIBDIVIDE_INLINE int64_t libdivide_s64_do(
 | 
					static LIBDIVIDE_INLINE int64_t libdivide_s64_do(
 | 
				
			||||||
    int64_t numer, const struct libdivide_s64_t *denom);
 | 
					    int64_t numer, const struct libdivide_s64_t *denom);
 | 
				
			||||||
 | 
					static LIBDIVIDE_INLINE uint64_t libdivide_u64_do_raw(
 | 
				
			||||||
 | 
					    uint64_t numer, uint64_t magic, uint8_t more);
 | 
				
			||||||
static LIBDIVIDE_INLINE uint64_t libdivide_u64_do(
 | 
					static LIBDIVIDE_INLINE uint64_t libdivide_u64_do(
 | 
				
			||||||
    uint64_t numer, const struct libdivide_u64_t *denom);
 | 
					    uint64_t numer, const struct libdivide_u64_t *denom);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
| 
						 | 
					@ -315,7 +334,7 @@ static LIBDIVIDE_INLINE int32_t libdivide_mullhi_s32(int32_t x, int32_t y) {
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
static LIBDIVIDE_INLINE uint64_t libdivide_mullhi_u64(uint64_t x, uint64_t y) {
 | 
					static LIBDIVIDE_INLINE uint64_t libdivide_mullhi_u64(uint64_t x, uint64_t y) {
 | 
				
			||||||
#if defined(LIBDIVIDE_VC) && defined(LIBDIVIDE_X86_64)
 | 
					#if defined(LIBDIVIDE_X64_INTRINSICS)
 | 
				
			||||||
    return __umulh(x, y);
 | 
					    return __umulh(x, y);
 | 
				
			||||||
#elif defined(HAS_INT128_T)
 | 
					#elif defined(HAS_INT128_T)
 | 
				
			||||||
    __uint128_t xl = x, yl = y;
 | 
					    __uint128_t xl = x, yl = y;
 | 
				
			||||||
| 
						 | 
					@ -341,7 +360,7 @@ static LIBDIVIDE_INLINE uint64_t libdivide_mullhi_u64(uint64_t x, uint64_t y) {
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
static LIBDIVIDE_INLINE int64_t libdivide_mullhi_s64(int64_t x, int64_t y) {
 | 
					static LIBDIVIDE_INLINE int64_t libdivide_mullhi_s64(int64_t x, int64_t y) {
 | 
				
			||||||
#if defined(LIBDIVIDE_VC) && defined(LIBDIVIDE_X86_64)
 | 
					#if defined(LIBDIVIDE_X64_INTRINSICS)
 | 
				
			||||||
    return __mulh(x, y);
 | 
					    return __mulh(x, y);
 | 
				
			||||||
#elif defined(HAS_INT128_T)
 | 
					#elif defined(HAS_INT128_T)
 | 
				
			||||||
    __int128_t xl = x, yl = y;
 | 
					    __int128_t xl = x, yl = y;
 | 
				
			||||||
| 
						 | 
					@ -914,12 +933,11 @@ struct libdivide_u32_branchfree_t libdivide_u32_branchfree_gen(uint32_t d) {
 | 
				
			||||||
    return ret;
 | 
					    return ret;
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
uint32_t libdivide_u32_do(uint32_t numer, const struct libdivide_u32_t *denom) {
 | 
					uint32_t libdivide_u32_do_raw(uint32_t numer, uint32_t magic, uint8_t more) {
 | 
				
			||||||
    uint8_t more = denom->more;
 | 
					    if (!magic) {
 | 
				
			||||||
    if (!denom->magic) {
 | 
					 | 
				
			||||||
        return numer >> more;
 | 
					        return numer >> more;
 | 
				
			||||||
    } else {
 | 
					    } else {
 | 
				
			||||||
        uint32_t q = libdivide_mullhi_u32(denom->magic, numer);
 | 
					        uint32_t q = libdivide_mullhi_u32(magic, numer);
 | 
				
			||||||
        if (more & LIBDIVIDE_ADD_MARKER) {
 | 
					        if (more & LIBDIVIDE_ADD_MARKER) {
 | 
				
			||||||
            uint32_t t = ((numer - q) >> 1) + q;
 | 
					            uint32_t t = ((numer - q) >> 1) + q;
 | 
				
			||||||
            return t >> (more & LIBDIVIDE_32_SHIFT_MASK);
 | 
					            return t >> (more & LIBDIVIDE_32_SHIFT_MASK);
 | 
				
			||||||
| 
						 | 
					@ -931,6 +949,10 @@ uint32_t libdivide_u32_do(uint32_t numer, const struct libdivide_u32_t *denom) {
 | 
				
			||||||
    }
 | 
					    }
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					uint32_t libdivide_u32_do(uint32_t numer, const struct libdivide_u32_t *denom) {
 | 
				
			||||||
 | 
					    return libdivide_u32_do_raw(numer, denom->magic, denom->more);
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
uint32_t libdivide_u32_branchfree_do(
 | 
					uint32_t libdivide_u32_branchfree_do(
 | 
				
			||||||
    uint32_t numer, const struct libdivide_u32_branchfree_t *denom) {
 | 
					    uint32_t numer, const struct libdivide_u32_branchfree_t *denom) {
 | 
				
			||||||
    uint32_t q = libdivide_mullhi_u32(denom->magic, numer);
 | 
					    uint32_t q = libdivide_mullhi_u32(denom->magic, numer);
 | 
				
			||||||
| 
						 | 
					@ -1074,12 +1096,11 @@ struct libdivide_u64_branchfree_t libdivide_u64_branchfree_gen(uint64_t d) {
 | 
				
			||||||
    return ret;
 | 
					    return ret;
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
uint64_t libdivide_u64_do(uint64_t numer, const struct libdivide_u64_t *denom) {
 | 
					uint64_t libdivide_u64_do_raw(uint64_t numer, uint64_t magic, uint8_t more) {
 | 
				
			||||||
    uint8_t more = denom->more;
 | 
					   if (!magic) {
 | 
				
			||||||
    if (!denom->magic) {
 | 
					 | 
				
			||||||
        return numer >> more;
 | 
					        return numer >> more;
 | 
				
			||||||
    } else {
 | 
					    } else {
 | 
				
			||||||
        uint64_t q = libdivide_mullhi_u64(denom->magic, numer);
 | 
					        uint64_t q = libdivide_mullhi_u64(magic, numer);
 | 
				
			||||||
        if (more & LIBDIVIDE_ADD_MARKER) {
 | 
					        if (more & LIBDIVIDE_ADD_MARKER) {
 | 
				
			||||||
            uint64_t t = ((numer - q) >> 1) + q;
 | 
					            uint64_t t = ((numer - q) >> 1) + q;
 | 
				
			||||||
            return t >> (more & LIBDIVIDE_64_SHIFT_MASK);
 | 
					            return t >> (more & LIBDIVIDE_64_SHIFT_MASK);
 | 
				
			||||||
| 
						 | 
					@ -1091,6 +1112,10 @@ uint64_t libdivide_u64_do(uint64_t numer, const struct libdivide_u64_t *denom) {
 | 
				
			||||||
    }
 | 
					    }
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					uint64_t libdivide_u64_do(uint64_t numer, const struct libdivide_u64_t *denom) {
 | 
				
			||||||
 | 
					    return libdivide_u64_do_raw(numer, denom->magic, denom->more);
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
uint64_t libdivide_u64_branchfree_do(
 | 
					uint64_t libdivide_u64_branchfree_do(
 | 
				
			||||||
    uint64_t numer, const struct libdivide_u64_branchfree_t *denom) {
 | 
					    uint64_t numer, const struct libdivide_u64_branchfree_t *denom) {
 | 
				
			||||||
    uint64_t q = libdivide_mullhi_u64(denom->magic, numer);
 | 
					    uint64_t q = libdivide_mullhi_u64(denom->magic, numer);
 | 
				
			||||||
| 
						 | 
					@ -1430,11 +1455,10 @@ struct libdivide_s32_branchfree_t libdivide_s32_branchfree_gen(int32_t d) {
 | 
				
			||||||
    return result;
 | 
					    return result;
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
int32_t libdivide_s32_do(int32_t numer, const struct libdivide_s32_t *denom) {
 | 
					int32_t libdivide_s32_do_raw(int32_t numer, int32_t magic, uint8_t more) {
 | 
				
			||||||
    uint8_t more = denom->more;
 | 
					 | 
				
			||||||
    uint8_t shift = more & LIBDIVIDE_32_SHIFT_MASK;
 | 
					    uint8_t shift = more & LIBDIVIDE_32_SHIFT_MASK;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
    if (!denom->magic) {
 | 
					    if (!magic) {
 | 
				
			||||||
        uint32_t sign = (int8_t)more >> 7;
 | 
					        uint32_t sign = (int8_t)more >> 7;
 | 
				
			||||||
        uint32_t mask = ((uint32_t)1 << shift) - 1;
 | 
					        uint32_t mask = ((uint32_t)1 << shift) - 1;
 | 
				
			||||||
        uint32_t uq = numer + ((numer >> 31) & mask);
 | 
					        uint32_t uq = numer + ((numer >> 31) & mask);
 | 
				
			||||||
| 
						 | 
					@ -1443,7 +1467,7 @@ int32_t libdivide_s32_do(int32_t numer, const struct libdivide_s32_t *denom) {
 | 
				
			||||||
        q = (q ^ sign) - sign;
 | 
					        q = (q ^ sign) - sign;
 | 
				
			||||||
        return q;
 | 
					        return q;
 | 
				
			||||||
    } else {
 | 
					    } else {
 | 
				
			||||||
        uint32_t uq = (uint32_t)libdivide_mullhi_s32(denom->magic, numer);
 | 
					        uint32_t uq = (uint32_t)libdivide_mullhi_s32(magic, numer);
 | 
				
			||||||
        if (more & LIBDIVIDE_ADD_MARKER) {
 | 
					        if (more & LIBDIVIDE_ADD_MARKER) {
 | 
				
			||||||
            // must be arithmetic shift and then sign extend
 | 
					            // must be arithmetic shift and then sign extend
 | 
				
			||||||
            int32_t sign = (int8_t)more >> 7;
 | 
					            int32_t sign = (int8_t)more >> 7;
 | 
				
			||||||
| 
						 | 
					@ -1458,6 +1482,10 @@ int32_t libdivide_s32_do(int32_t numer, const struct libdivide_s32_t *denom) {
 | 
				
			||||||
    }
 | 
					    }
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					int32_t libdivide_s32_do(int32_t numer, const struct libdivide_s32_t *denom) {
 | 
				
			||||||
 | 
					    return libdivide_s32_do_raw(numer, denom->magic, denom->more);
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
int32_t libdivide_s32_branchfree_do(int32_t numer, const struct libdivide_s32_branchfree_t *denom) {
 | 
					int32_t libdivide_s32_branchfree_do(int32_t numer, const struct libdivide_s32_branchfree_t *denom) {
 | 
				
			||||||
    uint8_t more = denom->more;
 | 
					    uint8_t more = denom->more;
 | 
				
			||||||
    uint8_t shift = more & LIBDIVIDE_32_SHIFT_MASK;
 | 
					    uint8_t shift = more & LIBDIVIDE_32_SHIFT_MASK;
 | 
				
			||||||
| 
						 | 
					@ -1599,11 +1627,10 @@ struct libdivide_s64_branchfree_t libdivide_s64_branchfree_gen(int64_t d) {
 | 
				
			||||||
    return ret;
 | 
					    return ret;
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
int64_t libdivide_s64_do(int64_t numer, const struct libdivide_s64_t *denom) {
 | 
					int64_t libdivide_s64_do_raw(int64_t numer, int64_t magic, uint8_t more) {
 | 
				
			||||||
    uint8_t more = denom->more;
 | 
					 | 
				
			||||||
    uint8_t shift = more & LIBDIVIDE_64_SHIFT_MASK;
 | 
					    uint8_t shift = more & LIBDIVIDE_64_SHIFT_MASK;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
    if (!denom->magic) {  // shift path
 | 
					    if (!magic) {  // shift path
 | 
				
			||||||
        uint64_t mask = ((uint64_t)1 << shift) - 1;
 | 
					        uint64_t mask = ((uint64_t)1 << shift) - 1;
 | 
				
			||||||
        uint64_t uq = numer + ((numer >> 63) & mask);
 | 
					        uint64_t uq = numer + ((numer >> 63) & mask);
 | 
				
			||||||
        int64_t q = (int64_t)uq;
 | 
					        int64_t q = (int64_t)uq;
 | 
				
			||||||
| 
						 | 
					@ -1613,7 +1640,7 @@ int64_t libdivide_s64_do(int64_t numer, const struct libdivide_s64_t *denom) {
 | 
				
			||||||
        q = (q ^ sign) - sign;
 | 
					        q = (q ^ sign) - sign;
 | 
				
			||||||
        return q;
 | 
					        return q;
 | 
				
			||||||
    } else {
 | 
					    } else {
 | 
				
			||||||
        uint64_t uq = (uint64_t)libdivide_mullhi_s64(denom->magic, numer);
 | 
					        uint64_t uq = (uint64_t)libdivide_mullhi_s64(magic, numer);
 | 
				
			||||||
        if (more & LIBDIVIDE_ADD_MARKER) {
 | 
					        if (more & LIBDIVIDE_ADD_MARKER) {
 | 
				
			||||||
            // must be arithmetic shift and then sign extend
 | 
					            // must be arithmetic shift and then sign extend
 | 
				
			||||||
            int64_t sign = (int8_t)more >> 7;
 | 
					            int64_t sign = (int8_t)more >> 7;
 | 
				
			||||||
| 
						 | 
					@ -1628,6 +1655,10 @@ int64_t libdivide_s64_do(int64_t numer, const struct libdivide_s64_t *denom) {
 | 
				
			||||||
    }
 | 
					    }
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					int64_t libdivide_s64_do(int64_t numer, const struct libdivide_s64_t *denom) {
 | 
				
			||||||
 | 
					    return libdivide_s64_do_raw(numer, denom->magic, denom->more);
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
int64_t libdivide_s64_branchfree_do(int64_t numer, const struct libdivide_s64_branchfree_t *denom) {
 | 
					int64_t libdivide_s64_branchfree_do(int64_t numer, const struct libdivide_s64_branchfree_t *denom) {
 | 
				
			||||||
    uint8_t more = denom->more;
 | 
					    uint8_t more = denom->more;
 | 
				
			||||||
    uint8_t shift = more & LIBDIVIDE_64_SHIFT_MASK;
 | 
					    uint8_t shift = more & LIBDIVIDE_64_SHIFT_MASK;
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
							
								
								
									
										7
									
								
								util.h
									
										
									
									
									
								
							
							
						
						
									
										7
									
								
								util.h
									
										
									
									
									
								
							| 
						 | 
					@ -32,6 +32,13 @@
 | 
				
			||||||
#define STRINGIFY(s) #s
 | 
					#define STRINGIFY(s) #s
 | 
				
			||||||
#define ALIAS(f) __attribute__((alias(STRINGIFY(f))))
 | 
					#define ALIAS(f) __attribute__((alias(STRINGIFY(f))))
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					// supported since GCC 15
 | 
				
			||||||
 | 
					#if __has_attribute (nonstring)
 | 
				
			||||||
 | 
					#  define NONSTRING __attribute__ ((nonstring))
 | 
				
			||||||
 | 
					#else
 | 
				
			||||||
 | 
					#  define NONSTRING
 | 
				
			||||||
 | 
					#endif
 | 
				
			||||||
 | 
					
 | 
				
			||||||
typedef uint8_t u8;
 | 
					typedef uint8_t u8;
 | 
				
			||||||
typedef uint16_t u16;
 | 
					typedef uint16_t u16;
 | 
				
			||||||
typedef uint32_t u32;
 | 
					typedef uint32_t u32;
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
		Loading…
	
	Add table
		
		Reference in a new issue