mirror of
https://github.com/BLAKE3-team/BLAKE3
synced 2024-09-19 14:22:30 +02:00
d91f20dd29
Wire up basic functions and features for SSE2 support using the SSE4.1 version as a basis without implementing the SSE2 instructions yet. * Cargo.toml: add no_sse2 feature * benches/bench.rs: wire SSE2 benchmarks * build.rs: add SSE2 rust intrinsics and assembly builds * c/Makefile.testing: add SSE2 C and assembly targets * c/README.md: add SSE2 to C build instructions * c/blake3_c_rust_bindings/build.rs: add SSE2 C rust binding builds * c/blake3_c_rust_bindings/src/lib.rs: add SSE2 C rust bindings * c/blake3_dispatch.c: add SSE2 C dispatch * c/blake3_impl.h: add SSE2 C function prototypes * c/blake3_sse2.c: add SSE2 C intrinsic file starting with SSE4.1 version * c/blake3_sse2_x86-64_{unix.S,windows_gnu.S,windows_msvc.asm}: add SSE2 assembly files starting with SSE4.1 version * src/ffi_sse2.rs: add rust implementation using SSE2 C rust bindings * src/lib.rs: add SSE2 rust intrinsics and SSE2 C rust binding rust SSE2 module configurations * src/platform.rs: add SSE2 rust platform detection and dispatch * src/rust_sse2.rs: add SSE2 rust intrinsic file starting with SSE4.1 version * tools/instruction_set_support/src/main.rs: add SSE2 feature detection
76 lines
1.8 KiB
Makefile
76 lines
1.8 KiB
Makefile
# This Makefile is only for testing. C callers should follow the instructions
|
|
# in ./README.md to incorporate these C files into their existing build.
|
|
|
|
NAME=blake3
|
|
CC=gcc
|
|
CFLAGS=-O3 -Wall -Wextra -std=c11 -pedantic -fstack-protector-strong -D_FORTIFY_SOURCE=2 -fPIE -fvisibility=hidden
|
|
LDFLAGS=-pie -Wl,-z,relro,-z,now
|
|
TARGETS=
|
|
ASM_TARGETS=
|
|
EXTRAFLAGS=-Wa,--noexecstack
|
|
|
|
ifdef BLAKE3_NO_SSE2
|
|
EXTRAFLAGS += -DBLAKE3_NO_SSE2
|
|
else
|
|
TARGETS += blake3_sse2.o
|
|
ASM_TARGETS += blake3_sse2_x86-64_unix.S
|
|
endif
|
|
|
|
ifdef BLAKE3_NO_SSE41
|
|
EXTRAFLAGS += -DBLAKE3_NO_SSE41
|
|
else
|
|
TARGETS += blake3_sse41.o
|
|
ASM_TARGETS += blake3_sse41_x86-64_unix.S
|
|
endif
|
|
|
|
ifdef BLAKE3_NO_AVX2
|
|
EXTRAFLAGS += -DBLAKE3_NO_AVX2
|
|
else
|
|
TARGETS += blake3_avx2.o
|
|
ASM_TARGETS += blake3_avx2_x86-64_unix.S
|
|
endif
|
|
|
|
ifdef BLAKE3_NO_AVX512
|
|
EXTRAFLAGS += -DBLAKE3_NO_AVX512
|
|
else
|
|
TARGETS += blake3_avx512.o
|
|
ASM_TARGETS += blake3_avx512_x86-64_unix.S
|
|
endif
|
|
|
|
ifdef BLAKE3_USE_NEON
|
|
EXTRAFLAGS += -DBLAKE3_USE_NEON
|
|
TARGETS += blake3_neon.o
|
|
endif
|
|
|
|
all: blake3.c blake3_dispatch.c blake3_portable.c main.c $(TARGETS)
|
|
$(CC) $(CFLAGS) $(EXTRAFLAGS) $^ -o $(NAME) $(LDFLAGS)
|
|
|
|
blake3_sse2.o: blake3_sse2.c
|
|
$(CC) $(CFLAGS) $(EXTRAFLAGS) -c $^ -o $@ -msse2
|
|
|
|
blake3_sse41.o: blake3_sse41.c
|
|
$(CC) $(CFLAGS) $(EXTRAFLAGS) -c $^ -o $@ -msse4.1
|
|
|
|
blake3_avx2.o: blake3_avx2.c
|
|
$(CC) $(CFLAGS) $(EXTRAFLAGS) -c $^ -o $@ -mavx2
|
|
|
|
blake3_avx512.o: blake3_avx512.c
|
|
$(CC) $(CFLAGS) $(EXTRAFLAGS) -c $^ -o $@ -mavx512f -mavx512vl
|
|
|
|
blake3_neon.o: blake3_neon.c
|
|
$(CC) $(CFLAGS) $(EXTRAFLAGS) -c $^ -o $@
|
|
|
|
test: CFLAGS += -DBLAKE3_TESTING -fsanitize=address,undefined
|
|
test: all
|
|
./test.py
|
|
|
|
asm: blake3.c blake3_dispatch.c blake3_portable.c main.c $(ASM_TARGETS)
|
|
$(CC) $(CFLAGS) $(EXTRAFLAGS) $^ -o $(NAME) $(LDFLAGS)
|
|
|
|
test_asm: CFLAGS += -DBLAKE3_TESTING -fsanitize=address,undefined
|
|
test_asm: asm
|
|
./test.py
|
|
|
|
clean:
|
|
rm -f $(NAME) *.o
|