day1: part 1 complete

Fortune for aoc2021's current commit: Curse − 凶
3 years ago · 7598a8d6b9
parent a8dce41cc4
commit 7598a8d6b9
8 changed files with 63 additions and 145 deletions
--- a/3
+++ b/3
@ -0,0 +1,3 @@
 #TODO: How to lay this out?
 day%/: day%/day%-release
--- a/day1/Makefile
+++ b/day1/Makefile
@ -9,9 +9,13 @@ SRC_CXX = $(wildcard src/*.cpp)
 INCLUDE=include
 INPUT_SOURCE=input
 INPUT_DEST=src/input.c
 COMMON_FLAGS+= -W -Wall -fno-strict-aliasing $(addprefix -I,$(INCLUDE))
 COMMON_FLAGS+=-msse -msse2 -msse3
 COMMON_FLAGS+=-D_PART1
 OPT_FLAGS?= -march=native -fgraphite -fopenmp -floop-parallelize-all -ftree-parallelize-loops=4 \
 	    -floop-interchange -ftree-loop-distribution -floop-strip-mine -floop-block \
@ -53,16 +57,21 @@ OBJ = $(OBJ_C) $(OBJ_CXX)
 # Phonies
 .PHONY: release
-release: | dirs $(PROJECT)-release
+release: | dirs $(INPUT_DEST)
 	$(MAKE) $(PROJECT)-release
 .PHONY: debug
-debug: | dirs $(PROJECT)-debug
+debug: | dirs $(INPUT_DEST)
 	$(MAKE) $(PROJECT)-debug
 # Targets
 dirs:
 	@mkdir -p obj/c{,xx}/src
 $(INPUT_DEST): $(INPUT_SOURCE)
 	./mkinput $< > $@
 obj/c/%.o: %.c
 	$(CC) -c $< $(CFLAGS) -o $@ $(LDFLAGS)
@ -87,4 +96,5 @@ clean-rebuild:
 clean: clean-rebuild
 	rm -f $(PROJECT)-{release,debug,pgo}
 	rm -f $(INPUT_DEST)
--- a/day1/include/input.h
+++ b/day1/include/input.h
@ -10,11 +10,14 @@ extern "C" {
 typedef uint16_t input_t;
 #define INPUT_VECTOR_STEP (16 / sizeof(input_t))
 extern const size_t  INPUT_SIZE;
 extern const input_t INPUT[];
 struct ipair {
 	input_t prev;
 	input_t next;
 };
 #ifdef __cplusplus
 }
 #endif
--- a/day1/include/vector.h
+++ b/day1/include/vector.h
@ -1,71 +0,0 @@
 #ifndef _VECTOR_H
 #define _VECTOR_H
 #ifdef __cplusplus
 extern "C" {
 #endif
 #include <stdint.h>
 #include <mmintrin.h>
 #include <immintrin.h>
 #include <tmmintrin.h>
 #include <xmmintrin.h>
 #include <emmintrin.h>
 #define _VECTOR_SIZE 16
 // Vector128 int 8
 typedef uint8_t  v8_u128n __attribute__((vector_size(_VECTOR_SIZE)));
 typedef int8_t   v8_i128n __attribute__((vector_size(_VECTOR_SIZE)));
 // Vector128 int 16
 typedef uint16_t v16_u128n __attribute__((vector_size(_VECTOR_SIZE)));
 typedef int16_t  v16_i128n __attribute__((vector_size(_VECTOR_SIZE)));
 // Vector128 int 32 
 typedef uint32_t v32_u128n __attribute__((vector_size(_VECTOR_SIZE)));
 typedef int32_t  v32_i128n __attribute__((vector_size(_VECTOR_SIZE)));
 // Vector128 int 64
 typedef uint64_t v64_u128n __attribute__((vector_size(_VECTOR_SIZE)));
 typedef int64_t  v64_i128n __attribute__((vector_size(_VECTOR_SIZE)));
 typedef union v128 {
 	// Intrinsics
 	__m128i mm; // long int
 	__m128d mmd; // double
 	__m128  mmf; // float //XXX: Should we have the halfs
 	// Vectorised integers
 	union {
 		v8_u128n u8;
 		v8_i128n i8;
 		v16_u128n u16;
 		v16_i128n i16;
 		v32_u128n u32;
 		v32_i128n i32;
 		v64_u128n u64;
 		v64_i128n i64;
 	} as;
 	// Native 128 bit integers
 	unsigned __int128 u128;
 	signed   __int128  i128;
 	// Raw bytes
 	uint8_t bytes[_VECTOR_SIZE];
 } v128_t;
 #ifdef __cplusplus
 }
 static_assert(sizeof(union v128)==_VECTOR_SIZE, "invalid vector size");
 static_assert(alignof(union v128)==alignof(__m128i), "invalid vector alignment");
 #else
 _Static_assert(sizeof(union v128)==_VECTOR_SIZE, "invalid vector size");
 _Static_assert(_Alignof(union v128)==_Alignof(__m128i), "invalid vector alignment");
 #endif
 #endif /* _VECTOR_H */
--- a/day1/mkinput
+++ b/day1/mkinput
@ -1,6 +1,6 @@
 #!/bin/bash
-INPUT=${INPUT:-input}
+INPUT=${1:-input}
 NUM=$(wc -l < ${INPUT})
--- a/day1/src/main.c
+++ b/day1/src/main.c
@ -0,0 +1,24 @@
 #include <stdio.h>
 #include <input.h>
 extern int part1(uint64_t* restrict);
 extern int part2();
 int main()
 {
 	register int r=0;
 #ifdef _PART1
 	uint64_t p1;
 	if( (r = part1(&p1)) ) return r;
 #ifdef DEBUG
 	printf("[1] >>> %lu\n", p1);
 #else
 	printf("%lu\n", p1);
 #endif
 #endif
 #ifdef _PART2
 	if( (r = part2()) ) return r;
 #endif
 	return r;
 }
--- a/day1/src/p1.c
+++ b/day1/src/p1.c
@ -0,0 +1,18 @@
 #include <input.h>
 __attribute__((pure))
 uint64_t chk_pair(const struct ipair* restrict pair)
 {
 	return pair->prev < pair->next;
 }
 int part1(uint64_t* restrict _res)
 {
 	uint64_t res = 0;
 	for(size_t i=0;i<INPUT_SIZE-1;i++)
 	{
 		res += chk_pair((const struct ipair*)(INPUT+i));
 	}
 	*_res = res;
 	return 0;
 }
--- a/day1/src/vcomp.c
+++ b/day1/src/vcomp.c
@ -1,69 +0,0 @@
 #include <assert.h>
 #include <input.h>
 #include <vector.h>
 #include <tracem/ints.h>
 _Static_assert(sizeof(input_t)*INPUT_VECTOR_STEP == sizeof(v128_t), "invalid vector size mul");
 #define INPUT_VPROC_STEP 15
 __attribute__((pure))
 u64 vproc(usize len, const input_t input[const restrict len])
 {
 	static const v128_t SINGLE = { .as.i16 = { -1, -1, -1, -1, -1, -1, -1, -1 } };
 	static const v128_t ONES   = { .as.i16 = {  1,  1,  1,  1,  1,  1,  1,  1 } };
 #if DEBUG
 	assert(len % INPUT_VPROC_STEP == 0);
 #endif
 #define LAST(j) input[i +  (j)]
 #define NEXT(j) input[i + ((j) * 2)]
 	__m128i end = _mm_setzero_si128();
 	for(usize i = 0;i<len;i+=INPUT_VPROC_STEP)
 	{
 		// load the vectors
 		v128_t prev = { .as.u16 = {
 				input[i+0],
 				input[i+2],
 				input[i+4],
 				input[i+6],
 				input[i+8],
 				input[i+10],
 				input[i+12],
 				input[i+14],
 			}
 		};
 		v128_t next = { .as.u16 = {
 				input[i+1],
 				input[i+3],
 				input[i+5],
 				input[i+7],
 				input[i+9],
 				input[i+11],
 				input[i+13],
 				input[i+15],
 			}
 		};
 		//__m128i res = _mm_subs_epi16(prev.mm, next.mm);
 		__m128i pltn = _mm_cmplt_epi16(prev.mm, next.mm); // prev < next
 		pltn = _mm_sign_epi16(pltn, SINGLE.mm);
 		pltn = _mm_sign_epi16(ONES.mm, pltn);
 		end = _mm_add_epi16(end, pltn);
 		//__m128i pr =  _mm_sign_epi16(FULL_MASK.mm, res);
 	}
 	v16_u128n _ev = ((union v128)end).as.u16;
 	return (u64) (    _ev[0] + _ev[1] 
 			+ _ev[2] + _ev[3]
 			+ _ev[4] + _ev[5]
 			+ _ev[6] + _ev[7] );
 }
		`@ -0,0 +1,3 @@`

							`#TODO: How to lay this out?`
							`day%/: day%/day%-release`