added insertion sort and regression test

This commit is contained in:
Ahmet Inan 2024-03-05 11:46:33 +01:00
commit ae0a749d08
2 changed files with 70 additions and 101 deletions

119
sort.hh
View file

@ -6,107 +6,32 @@ Copyright 2024 Ahmet Inan <inan@aicodix.de>
#pragma once
#include <algorithm>
template <int WIDTH>
static inline SIMD<uint32_t, WIDTH> vorder(SIMD<float, WIDTH> a)
template <typename TYPE, int WIDTH>
static inline SIMD<typename SIMD<TYPE, WIDTH>::uint_type, WIDTH> vorder(SIMD<TYPE, WIDTH> a)
{
SIMD<uint32_t, WIDTH> tmp;
for (int i = 0; i < WIDTH; ++i)
tmp.v[i] = i;
std::stable_sort(tmp.v, tmp.v+WIDTH, [a](int i, int j){ return a.v[i] < a.v[j]; });
return tmp;
SIMD<typename SIMD<TYPE, WIDTH>::uint_type, WIDTH> p;
p.v[0] = 0;
for (int i = 1, j; i < WIDTH; ++i) {
TYPE t = a.v[i];
for (j = i; j > 0 && a.v[j-1] > t; --j) {
a.v[j] = a.v[j-1];
p.v[j] = p.v[j-1];
}
a.v[j] = t;
p.v[j] = i;
}
return p;
}
template <int WIDTH>
static inline SIMD<uint64_t, WIDTH> vorder(SIMD<double, WIDTH> a)
template <typename TYPE, int WIDTH>
static inline SIMD<TYPE, WIDTH> vsort(SIMD<TYPE, WIDTH> a)
{
SIMD<uint64_t, WIDTH> tmp;
for (int i = 0; i < WIDTH; ++i)
tmp.v[i] = i;
std::stable_sort(tmp.v, tmp.v+WIDTH, [a](int i, int j){ return a.v[i] < a.v[j]; });
return tmp;
}
template <int WIDTH>
static inline SIMD<uint8_t, WIDTH> vorder(SIMD<int8_t, WIDTH> a)
{
SIMD<uint8_t, WIDTH> tmp;
for (int i = 0; i < WIDTH; ++i)
tmp.v[i] = i;
std::stable_sort(tmp.v, tmp.v+WIDTH, [a](int i, int j){ return a.v[i] < a.v[j]; });
return tmp;
}
template <int WIDTH>
static inline SIMD<uint16_t, WIDTH> vorder(SIMD<int16_t, WIDTH> a)
{
SIMD<uint16_t, WIDTH> tmp;
for (int i = 0; i < WIDTH; ++i)
tmp.v[i] = i;
std::stable_sort(tmp.v, tmp.v+WIDTH, [a](int i, int j){ return a.v[i] < a.v[j]; });
return tmp;
}
template <int WIDTH>
static inline SIMD<uint32_t, WIDTH> vorder(SIMD<int32_t, WIDTH> a)
{
SIMD<uint32_t, WIDTH> tmp;
for (int i = 0; i < WIDTH; ++i)
tmp.v[i] = i;
std::stable_sort(tmp.v, tmp.v+WIDTH, [a](int i, int j){ return a.v[i] < a.v[j]; });
return tmp;
}
template <int WIDTH>
static inline SIMD<uint64_t, WIDTH> vorder(SIMD<int64_t, WIDTH> a)
{
SIMD<uint64_t, WIDTH> tmp;
for (int i = 0; i < WIDTH; ++i)
tmp.v[i] = i;
std::stable_sort(tmp.v, tmp.v+WIDTH, [a](int i, int j){ return a.v[i] < a.v[j]; });
return tmp;
}
template <int WIDTH>
static inline SIMD<float, WIDTH> vsort(SIMD<float, WIDTH> a)
{
std::sort(a.v, a.v+WIDTH);
return a;
}
template <int WIDTH>
static inline SIMD<double, WIDTH> vsort(SIMD<double, WIDTH> a)
{
std::sort(a.v, a.v+WIDTH);
return a;
}
template <int WIDTH>
static inline SIMD<int8_t, WIDTH> vsort(SIMD<int8_t, WIDTH> a)
{
std::sort(a.v, a.v+WIDTH);
return a;
}
template <int WIDTH>
static inline SIMD<int16_t, WIDTH> vsort(SIMD<int16_t, WIDTH> a)
{
std::sort(a.v, a.v+WIDTH);
return a;
}
template <int WIDTH>
static inline SIMD<int32_t, WIDTH> vsort(SIMD<int32_t, WIDTH> a)
{
std::sort(a.v, a.v+WIDTH);
return a;
}
template <int WIDTH>
static inline SIMD<int64_t, WIDTH> vsort(SIMD<int64_t, WIDTH> a)
{
std::sort(a.v, a.v+WIDTH);
for (int i = 1, j; i < WIDTH; ++i) {
TYPE t = a.v[i];
for (j = i; j > 0 && a.v[j-1] > t; --j)
a.v[j] = a.v[j-1];
a.v[j] = t;
}
return a;
}