diff options
author | Toni Uhlig <matzeton@googlemail.com> | 2023-07-16 02:03:33 +0200 |
---|---|---|
committer | Toni Uhlig <matzeton@googlemail.com> | 2023-07-16 02:03:33 +0200 |
commit | 5a40295c4cf0af5ea8da9ced04a4ce7d3621a080 (patch) | |
tree | cb21506e7b04d10b45d6066a0ee1655563d5d52b /src/compiler/codegen_c_sort.c |
Squashed 'flatcc/' content from commit 473da2a
git-subtree-dir: flatcc
git-subtree-split: 473da2afa5ca435363f8c5e6569167aee6bc31c5
Diffstat (limited to 'src/compiler/codegen_c_sort.c')
-rw-r--r-- | src/compiler/codegen_c_sort.c | 171 |
1 files changed, 171 insertions, 0 deletions
diff --git a/src/compiler/codegen_c_sort.c b/src/compiler/codegen_c_sort.c new file mode 100644 index 0000000..4319f96 --- /dev/null +++ b/src/compiler/codegen_c_sort.c @@ -0,0 +1,171 @@ +#include "codegen_c_sort.h" + +/* + * We choose heapsort because it is about as fast as quicksort, avoids + * recursion, the code is compact which makes it practical to specialize for + * different vector types, it can sort the flatbuffer arrays in-place, + * and it has only a few places with comparisons. Furthermore, heapsort + * has worst case (n log n) upperbound where quicksort has O(n^2) which + * is an attack vector, and could be a problem with large datasets + * The sort is not stable. + * + * Some arguments are similar to those of the __%sfind_by_field macro. + * + * NS: The namespace + * N: the name of the vector type + * X: the name suffix when there are multiple sorts for same vector type. + * E: Element accessor (elem = E(vector, index)). + * L: Vector length. + * A: Field accessor (or the identity function), result must match the diff function D. + * TK: The scalar, enum or string key type, (either the element, or a field of the element). + * TE: The raw element type - uoffset_t for tables and strings. + * for swap. + * D: The diff function, but unlike __find_by_field, the second + * argument is returned by A, not a search key, and there is no third argument. + * S: Swap operation - must handle offset change when offset elements are moved. + */ + +int gen_sort(fb_output_t *out) +{ + fprintf(out->fp, + "#define __%sheap_sort(N, X, A, E, L, TK, TE, D, S)\\\n" + "static inline void __ ## N ## X ## __heap_sift_down(\\\n" + " N ## _mutable_vec_t vec__tmp, size_t start__tmp, size_t end__tmp)\\\n" + "{ size_t child__tmp, root__tmp; TK v1__tmp, v2__tmp, vroot__tmp;\\\n" + " root__tmp = start__tmp;\\\n" + " while ((root__tmp << 1) <= end__tmp) {\\\n" + " child__tmp = root__tmp << 1;\\\n" + " if (child__tmp < end__tmp) {\\\n" + " v1__tmp = A(E(vec__tmp, child__tmp));\\\n" + " v2__tmp = A(E(vec__tmp, child__tmp + 1));\\\n" + " if (D(v1__tmp, v2__tmp) < 0) {\\\n" + " child__tmp++;\\\n" + " }\\\n" + " }\\\n" + " vroot__tmp = A(E(vec__tmp, root__tmp));\\\n" + " v1__tmp = A(E(vec__tmp, child__tmp));\\\n" + " if (D(vroot__tmp, v1__tmp) < 0) {\\\n" + " S(vec__tmp, root__tmp, child__tmp, TE);\\\n" + " root__tmp = child__tmp;\\\n" + " } else {\\\n" + " return;\\\n" + " }\\\n" + " }\\\n" + "}\\\n" + "static inline void __ ## N ## X ## __heap_sort(N ## _mutable_vec_t vec__tmp)\\\n" + "{ size_t start__tmp, end__tmp, size__tmp;\\\n" + " size__tmp = L(vec__tmp); if (size__tmp == 0) return; end__tmp = size__tmp - 1; start__tmp = size__tmp >> 1;\\\n" + " do { __ ## N ## X ## __heap_sift_down(vec__tmp, start__tmp, end__tmp); } while (start__tmp--);\\\n" + " while (end__tmp > 0) { \\\n" + " S(vec__tmp, 0, end__tmp, TE);\\\n" + " __ ## N ## X ## __heap_sift_down(vec__tmp, 0, --end__tmp); } }\n", + out->nsc); + fprintf(out->fp, + "#define __%sdefine_sort_by_field(N, NK, TK, TE, D, S)\\\n" + " __%sheap_sort(N, _sort_by_ ## NK, N ## _ ## NK ## _get, N ## _vec_at, N ## _vec_len, TK, TE, D, S)\\\n" + "static inline void N ## _vec_sort_by_ ## NK(N ## _mutable_vec_t vec__tmp)\\\n" + "{ __ ## N ## _sort_by_ ## NK ## __heap_sort(vec__tmp); }\n", + out->nsc, out->nsc); + fprintf(out->fp, + "#define __%sdefine_sort(N, TK, TE, D, S)\\\n" + "__%sheap_sort(N, , __%sidentity, N ## _vec_at, N ## _vec_len, TK, TE, D, S)\\\n" + "static inline void N ## _vec_sort(N ## _mutable_vec_t vec__tmp) { __ ## N ## __heap_sort(vec__tmp); }\n", + out->nsc, out->nsc, out->nsc); + fprintf(out->fp, + /* Subtractions doesn't work for unsigned types. */ + "#define __%sscalar_diff(x, y) ((x) < (y) ? -1 : (x) > (y))\n" + "#define __%sstring_diff(x, y) __%sstring_n_cmp((x), (const char *)(y), %sstring_len(y))\n", + out->nsc, out->nsc, out->nsc, out->nsc); + fprintf(out->fp, + "#define __%svalue_swap(vec, a, b, TE) { TE x__tmp = vec[b]; vec[b] = vec[a]; vec[a] = x__tmp; }\n" + "#define __%suoffset_swap(vec, a, b, TE)\\\n" + "{ TE ta__tmp, tb__tmp, d__tmp;\\\n" + " d__tmp = (TE)((a - b) * sizeof(vec[0]));\\\n" + " ta__tmp = __flatbuffers_uoffset_read_from_pe(vec + b) - d__tmp;\\\n" + " tb__tmp = __flatbuffers_uoffset_read_from_pe(vec + a) + d__tmp;\\\n" + " __flatbuffers_uoffset_write_to_pe(vec + a, ta__tmp);\\\n" + " __flatbuffers_uoffset_write_to_pe(vec + b, tb__tmp); }\n", + out->nsc, out->nsc); + fprintf(out->fp, + "#define __%sscalar_swap(vec, a, b, TE) __%svalue_swap(vec, a, b, TE)\n", + out->nsc, out->nsc); + fprintf(out->fp, + "#define __%sstring_swap(vec, a, b, TE) __%suoffset_swap(vec, a, b, TE)\n", + out->nsc, out->nsc); + fprintf(out->fp, + "#define __%sstruct_swap(vec, a, b, TE) __%svalue_swap(vec, a, b, TE)\n", + out->nsc, out->nsc); + fprintf(out->fp, + "#define __%stable_swap(vec, a, b, TE) __%suoffset_swap(vec, a, b, TE)\n", + out->nsc, out->nsc); + fprintf(out->fp, + "#define __%sdefine_struct_sort_by_scalar_field(N, NK, TK, TE)\\\n" + " __%sdefine_sort_by_field(N, NK, TK, TE, __%sscalar_diff, __%sstruct_swap)\n", + out->nsc, out->nsc, out->nsc, out->nsc); + fprintf(out->fp, + "#define __%sdefine_table_sort_by_scalar_field(N, NK, TK)\\\n" + " __%sdefine_sort_by_field(N, NK, TK, %suoffset_t, __%sscalar_diff, __%stable_swap)\n", + out->nsc, out->nsc, out->nsc, out->nsc, out->nsc); + fprintf(out->fp, + "#define __%sdefine_table_sort_by_string_field(N, NK)\\\n" + " __%sdefine_sort_by_field(N, NK, %sstring_t, %suoffset_t, __%sstring_diff, __%stable_swap)\n", + out->nsc, out->nsc, out->nsc, out->nsc, out->nsc, out->nsc); + fprintf(out->fp, + "#define __%sdefine_scalar_sort(N, T) __%sdefine_sort(N, T, T, __%sscalar_diff, __%sscalar_swap)\n", + out->nsc, out->nsc, out->nsc, out->nsc); + fprintf(out->fp, + "#define __%sdefine_string_sort() __%sdefine_sort(%sstring, %sstring_t, %suoffset_t, __%sstring_diff, __%sstring_swap)\n", + out->nsc, out->nsc, out->nsc, out->nsc, out->nsc, out->nsc, out->nsc); + return 0; +} + +/* reference implementation */ +#if 0 + +/* from github swenson/sort */ +/* heap sort: based on wikipedia */ +static __inline void HEAP_SIFT_DOWN(SORT_TYPE *dst, const int64_t start, const int64_t end) { + int64_t root = start; + + while ((root << 1) <= end) { + int64_t child = root << 1; + + if ((child < end) && (SORT_CMP(dst[child], dst[child + 1]) < 0)) { + child++; + } + + if (SORT_CMP(dst[root], dst[child]) < 0) { + SORT_SWAP(dst[root], dst[child]); + root = child; + } else { + return; + } + } +} + +static __inline void HEAPIFY(SORT_TYPE *dst, const size_t size) { + int64_t start = size >> 1; + + while (start >= 0) { + HEAP_SIFT_DOWN(dst, start, size - 1); + start--; + } +} + +void HEAP_SORT(SORT_TYPE *dst, const size_t size) { + /* don't bother sorting an array of size 0 */ + if (size == 0) { + return; + } + + int64_t end = size - 1; + HEAPIFY(dst, size); + + while (end > 0) { + SORT_SWAP(dst[end], dst[0]); + HEAP_SIFT_DOWN(dst, 0, end - 1); + end--; + } +} + +#endif |