update

lemire · lemire · commit 230cfa360064 · 2025-11-14T18:52:58.000-05:00
diff --git a/.travis.yml b/.travis.yml
diff --git a/CMakeLists.txt b/CMakeLists.txt
@@ -0,0 +1,108 @@
+# Target-based CMake build for MaskedVByte; CMake 3.15 or newer is required.
+cmake_minimum_required(VERSION 3.15)
+
+project(MaskedVByte VERSION 0.0.1 LANGUAGES C)
+
+# Helper modules: standard install directories, package-config generation,
+# and compiler flag probing.
+include(GNUInstallDirs)
+include(CMakePackageConfigHelpers)
+include(CheckCCompilerFlag)
+
+# Examples and tests are developer conveniences. They default to ON only when
+# MaskedVByte is the top-level project, so that a parent project pulling this
+# one in through add_subdirectory()/FetchContent does not build the generically
+# named `example` and `unit` targets unless it asks for them explicitly.
+# (PROJECT_IS_TOP_LEVEL would need CMake 3.21; this comparison works on 3.15.)
+if ("${CMAKE_SOURCE_DIR}" STREQUAL "${PROJECT_SOURCE_DIR}")
+    set(MASKEDVBYTE_IS_TOP_LEVEL ON)
+else()
+    set(MASKEDVBYTE_IS_TOP_LEVEL OFF)
+endif()
+
+# MASKEDVBYTE_BUILD_EXAMPLES: build the example program.
+option(MASKEDVBYTE_BUILD_EXAMPLES "Build examples" ${MASKEDVBYTE_IS_TOP_LEVEL})
+# MASKEDVBYTE_BUILD_TESTS: build the unit test and register it with CTest.
+option(MASKEDVBYTE_BUILD_TESTS "Build tests" ${MASKEDVBYTE_IS_TOP_LEVEL})
+
+# Headers that make up the public API (also used by the install rules)
+set(MASKEDVBYTE_PUBLIC_HEADERS
+    include/varintdecode.h
+    include/varintencode.h
+)
+
+# The library target and its namespaced alias for in-tree consumers
+add_library(maskedvbyte src/varintdecode.c src/varintencode.c)
+add_library(maskedvbyte::maskedvbyte ALIAS maskedvbyte)
+
+# Usage requirements: C99, plus the header directory for both the build tree
+# and the installed package
+target_compile_features(maskedvbyte PUBLIC c_std_99)
+target_include_directories(maskedvbyte PUBLIC
+    "$<BUILD_INTERFACE:${CMAKE_CURRENT_SOURCE_DIR}/include>"
+    "$<INSTALL_INTERFACE:${CMAKE_INSTALL_INCLUDEDIR}>"
+)
+
+# Artifact naming, versioning and position-independent code
+set_target_properties(maskedvbyte PROPERTIES
+    POSITION_INDEPENDENT_CODE ON
+    OUTPUT_NAME maskedvbyte
+    SOVERSION "${PROJECT_VERSION_MAJOR}"
+    VERSION "${PROJECT_VERSION}"
+)
+
+# On GCC and Clang-family compilers (the unanchored regex also covers
+# AppleClang), probe for -msse4.1 and add it to the library's own compile
+# options when the compiler accepts it.
+if (CMAKE_C_COMPILER_ID MATCHES "GNU|Clang")
+    check_c_compiler_flag(-msse4.1 HAS_SSE41_FLAG)
+    if (HAS_SSE41_FLAG)
+        target_compile_options(maskedvbyte PRIVATE "-msse4.1")
+    endif()
+endif()
+
+# Example program, controlled by MASKEDVBYTE_BUILD_EXAMPLES
+if (MASKEDVBYTE_BUILD_EXAMPLES)
+    add_executable(example "examples/example.c")
+    target_compile_features(example PRIVATE c_std_99)
+    target_include_directories(example
+        PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}/include"
+    )
+    target_link_libraries(example PRIVATE maskedvbyte)
+endif()
+
+# Unit test executable, registered with CTest under the name maskedvbyte_unit
+if (MASKEDVBYTE_BUILD_TESTS)
+    include(CTest)
+
+    add_executable(unit "tests/unit.c")
+    target_compile_features(unit PRIVATE c_std_99)
+    target_include_directories(unit
+        PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}/include"
+    )
+    target_link_libraries(unit PRIVATE maskedvbyte)
+
+    add_test(NAME maskedvbyte_unit COMMAND unit)
+endif()
+
+# Installation: the library (recorded in the maskedvbyteTargets export set)
+# followed by the public headers
+install(
+    TARGETS maskedvbyte
+    EXPORT maskedvbyteTargets
+    RUNTIME DESTINATION "${CMAKE_INSTALL_BINDIR}"
+    LIBRARY DESTINATION "${CMAKE_INSTALL_LIBDIR}"
+    ARCHIVE DESTINATION "${CMAKE_INSTALL_LIBDIR}"
+    INCLUDES DESTINATION "${CMAKE_INSTALL_INCLUDEDIR}"
+)
+
+install(
+    FILES ${MASKEDVBYTE_PUBLIC_HEADERS}
+    DESTINATION "${CMAKE_INSTALL_INCLUDEDIR}"
+)
+
+# CMake package files: exported targets, config file and version file all
+# install into the same directory under the library dir
+set(MASKEDVBYTE_INSTALL_CMAKEDIR "${CMAKE_INSTALL_LIBDIR}/cmake/maskedvbyte")
+
+install(EXPORT maskedvbyteTargets
+    NAMESPACE maskedvbyte::
+    DESTINATION "${MASKEDVBYTE_INSTALL_CMAKEDIR}"
+)
+
+# Generate maskedvbyteConfig.cmake from the template in cmake/
+configure_package_config_file(
+    cmake/maskedvbyteConfig.cmake.in
+    "${CMAKE_CURRENT_BINARY_DIR}/maskedvbyteConfig.cmake"
+    INSTALL_DESTINATION "${MASKEDVBYTE_INSTALL_CMAKEDIR}"
+)
+
+# Generate the matching version file (compatible within one major version)
+write_basic_package_version_file(
+    "${CMAKE_CURRENT_BINARY_DIR}/maskedvbyteConfigVersion.cmake"
+    VERSION "${PROJECT_VERSION}"
+    COMPATIBILITY SameMajorVersion
+)
+
+install(
+    FILES
+        "${CMAKE_CURRENT_BINARY_DIR}/maskedvbyteConfig.cmake"
+        "${CMAKE_CURRENT_BINARY_DIR}/maskedvbyteConfigVersion.cmake"
+    DESTINATION "${MASKEDVBYTE_INSTALL_CMAKEDIR}"
+)
+
+# Also write the targets file into the build directory so the package can be
+# used straight from the build tree
+export(
+    EXPORT maskedvbyteTargets
+    FILE "${CMAKE_CURRENT_BINARY_DIR}/maskedvbyteTargets.cmake"
+    NAMESPACE maskedvbyte::
+)
diff --git a/Makefile b/Makefile
@@ -43,8 +43,8 @@ $(LIBNAME): $(OBJECTS)
 
 
 
-example: ./example.c    $(HEADERS) $(OBJECTS)
-	$(CC) $(CFLAGS) -o example ./example.c -Iinclude  $(OBJECTS)
+example: ./examples/example.c    $(HEADERS) $(OBJECTS)
+	$(CC) $(CFLAGS) -o example ./examples/example.c -Iinclude  $(OBJECTS)
 
 unit: ./tests/unit.c    $(HEADERS) $(OBJECTS)
 	$(CC) $(CFLAGS) -o unit ./tests/unit.c -Iinclude  $(OBJECTS)
diff --git a/README.md b/README.md
@@ -2,30 +2,98 @@ MaskedVByte
 ===========
 [![Ubuntu](https://github.com/fast-pack/MaskedVByte/actions/workflows/ubuntu.yml/badge.svg)](https://github.com/fast-pack/MaskedVByte/actions/workflows/ubuntu.yml)
 
-Fast decoder for VByte-compressed integers in C.
+Fast, vectorized VByte decoding for 32‑bit integers in C, with optional differential (delta) coding.
 
-It includes fast differential coding.
+- Requires x86-64 with SSE4.1 (available on virtually all modern x64 CPUs)
+- C99 compatible
+- Includes a tiny test and a runnable example
 
-We require x64 processors support SSE 4.1 or better. This includes virtually all x64 processors in service today, except for very old or specialized processors.
+Platform notes
+--------------
+- The library and tests build on Linux and macOS with a standard C toolchain.
+- The Makefile's `install` target installs a shared object named `libmaskedvbyte.so` and runs `ldconfig`, both of which are Linux-specific. On macOS the build and run targets work, but the `install` target does not apply.
 
-The code should build using most standard-compliant modern C compilers (C99). The provided makefile
-expects a Linux-like system.
 
+Build and test
+--------------
 
-Usage:
+```sh
+make        # builds the library and the test binary
+./unit      # runs a quick correctness test
+```
 
-      make
-      ./unit 
+Build and run the example
+-------------------------
 
-See example.c for an example.
+```sh
+make example
+./example
+```
 
-Short code sample:
+You should see something like:
 
-```C
-size_t compsize = vbyte_encode(datain, N, compressedbuffer); // encoding
-// here the result is stored in compressedbuffer using compsize bytes
-size_t compsize2 = masked_vbyte_decode(compressedbuffer, recovdata, N); // decoding (fast)
 ```
+Compressed 5000 integers down to 5000 bytes.
+```
+
+Embedded example, explained
+---------------------------
+The example allocates input/output buffers, encodes a flat array of integers with classic VByte, then decodes it back with the masked (vectorized) decoder and verifies the sizes match.
+
+```c
+#include <stdio.h>
+#include <stdlib.h>
+#include <assert.h>
+
+#include "varintencode.h"
+#include "varintdecode.h"
+
+int main() {
+    int N = 5000;
+    uint32_t * datain = malloc(N * sizeof(uint32_t));
+    // VByte stores 7 payload bits per byte, so a 32-bit value may need up to
+    // 5 bytes: size the compressed buffer for that worst case
+    uint8_t * compressedbuffer = malloc(N * 5);
+    uint32_t * recovdata = malloc(N * sizeof(uint32_t));
+    for (int k = 0; k < N; ++k)
+        datain[k] = 120; // constant value fits in one VByte
+    size_t compsize = vbyte_encode(datain, N, compressedbuffer); // encoding
+    // result is stored in 'compressedbuffer' using 'compsize' bytes
+    size_t compsize2 = masked_vbyte_decode(compressedbuffer, recovdata, N); // fast decoding
+    assert(compsize == compsize2); // sanity check: both calls report the same byte count
+    free(datain);
+    free(compressedbuffer);
+    free(recovdata);
+    printf("Compressed %d integers down to %d bytes.\n", N, (int)compsize);
+    return 0;
+}
+```
+
+What’s happening:
+- VByte stores 7 payload bits per byte plus a continuation bit; values below 128, such as 120, encode to a single byte, so 5000 values compress to 5000 bytes.
+- `masked_vbyte_decode` is a vectorized decoder using SSE4.1 for speed.
+- Differential coding variants are available when your data is sorted or has small gaps.
+
+API at a glance
+---------------
+Headers are in `include/`.
+
+- Encoding
+      - `size_t vbyte_encode(const uint32_t* in, size_t length, uint8_t* bout);`
+      - `size_t vbyte_encode_delta(const uint32_t* in, size_t length, uint8_t* bout, uint32_t prev);`
+
+- Decoding
+      - `size_t masked_vbyte_decode(const uint8_t* in, uint32_t* out, uint64_t length);`
+      - `size_t masked_vbyte_decode_delta(const uint8_t* in, uint32_t* out, uint64_t length, uint32_t prev);`
+      - `size_t masked_vbyte_decode_fromcompressedsize(const uint8_t* in, uint32_t* out, size_t inputsize);`
+      - `size_t masked_vbyte_decode_fromcompressedsize_delta(const uint8_t* in, uint32_t* out, size_t inputsize, uint32_t prev);`
+      - Random access helpers for delta streams:
+            - `uint32_t masked_vbyte_select_delta(const uint8_t *in, uint64_t length, uint32_t prev, size_t slot);`
+            - `int masked_vbyte_search_delta(const uint8_t *in, uint64_t length, uint32_t prev, uint32_t key, uint32_t *presult);`
+
+Tips
+----
+- Prefer delta coding when your sequence is sorted or has small differences; it often reduces the number of bytes per integer.
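+- If you know the compressed byte length rather than the number of integers, use the `masked_vbyte_decode_fromcompressedsize` and `masked_vbyte_decode_fromcompressedsize_delta` functions to decode exactly that many bytes.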
+
 
 Interesting applications 
 -----------------------
@@ -60,3 +128,8 @@ See also
 * Oroch is a C++ library that offers a usable API (MIT license) https://github.com/ademakov/Oroch
 
 
+License
+-------
+See `LICENSE` for details.
+
+
diff --git a/cmake/maskedvbyteConfig.cmake.in b/cmake/maskedvbyteConfig.cmake.in
@@ -0,0 +1,8 @@
+# Package configuration template for MaskedVByte. The @PACKAGE_INIT@
+# placeholder is substituted by configure_package_config_file().
+@PACKAGE_INIT@
+
+include(CMakeFindDependencyMacro)
+# Add find_dependency(...) here if the library gains external deps
+
+# Load the exported targets file that sits next to this config file
+include("${CMAKE_CURRENT_LIST_DIR}/maskedvbyteTargets.cmake")
+
+# Macro made available by @PACKAGE_INIT@: marks the package as not found when
+# a required component is missing
+check_required_components(maskedvbyte)
diff --git a/examples/example.c b/examples/example.c