Why Gemfury? Push, build, and install  RubyGems npm packages Python packages Maven artifacts PHP packages Go Modules Debian packages RPM packages NuGet packages

Repository URL to install this package:

Details    
Size: Mime:
#ifndef RAPIDFUZZ_CAPI_H
#define RAPIDFUZZ_CAPI_H

#ifdef __cplusplus
extern "C" {
#endif

#include "Python.h"

#include <stdbool.h>
#include <stddef.h>
#include <stdint.h>

/**
 * @brief string types
 */
enum RF_StringType {
    RF_UINT8,  /**< char type uint8_t */
    RF_UINT16, /**< char type uint16_t */
    RF_UINT32, /**< char type uint32_t */
    RF_UINT64  /**< char type uint64_t */
};

/**
 * @brief basic string type used for all strings in RapidFuzz
 */
typedef struct _RF_String {
    /**
     * @brief destructor for RF_String
     *
     * @param self pointer to RF_String instance to destruct
     */
    void (*dtor)(struct _RF_String* self);

    /* members */
    RF_StringType kind; /**< flag to specify string type stored in data */
    void* data;         /**< string data */
    int64_t length;     /**< string length */
    void* context;      /**< context which can be used to store addition information
                         * required for the string like e.g. a PyObject which needs
                         * to be decrefed in the destructor */
} RF_String;

/**
 * @brief convert python object to RF_String and preprocess it
 *
 * @param[in] obj Python object
 * @param[out] str Preprocessed String
 *
 * @return true on success and false with a Python exception set on failure
 */
typedef bool (*RF_Preprocess)(PyObject* obj, RF_String* str);

/**
 * @brief struct describing a Processor callback function.
 */
typedef struct {
#define PREPROCESSOR_STRUCT_VERSION ((uint32_t)1)
    uint32_t version;         /**< version number of the structure. Set to PREPROCESSOR_STRUCT_VERSION */
    RF_Preprocess preprocess; /**< function to preprocess string */
} RF_Preprocessor;

/**
 * @brief struct describing keyword arguments
 */
typedef struct _RF_Kwargs {
    /**
     * @brief destructor for RF_Kwargs
     *
     * @param self pointer to RF_Kwargs instance to destruct
     */
    void (*dtor)(struct _RF_Kwargs* self);

    /* members */
    void* context; /**< context used to store the keyword arguments */
} RF_Kwargs;

/**
 * @brief construct RF_Kwargs
 *
 * @param[out] self constructed RF_Kwargs instance
 * @param[in] kwargs Python dictionary holding keyword arguments
 *
 * @return true on success and false with a Python exception set on failure
 */
typedef bool (*RF_KwargsInit)(RF_Kwargs* self, PyObject* kwargs);

/**
 * @brief struct describing a Scorer
 */
typedef struct _RF_ScorerFunc {
    /**
     * @brief Destructor for RF_ScorerFunc
     *
     * @param self pointer to RF_ScorerFunc instance to destruct
     */
    void (*dtor)(struct _RF_ScorerFunc* self);

    /**
     * @brief Calculate edit distance
     *
     * @note has to be specified using RF_SCORER_FLAG_*:
     * - RF_SCORER_FLAG_RESULT_F64 -> call.f64
     * - RF_SCORER_FLAG_RESULT_I64 -> call.i64
     * - RF_SCORER_FLAG_RESULT_SIZE_T -> call.sizet
     *
     * @param[in] self pointer to RF_ScorerFunc instance
     * @param[in] str string to calculate distance with `strings` passed into `ctor`
     * @param[in] score_cutoff argument for a score threshold
     * @param[in] score_hint argument for an expected score to improve the performance
     * @param[out] result array of size `str_count` for results of the calculation
     *
     * @return true on success and false with a Python exception set on failure
     */
    union {
        bool (*f64)(const struct _RF_ScorerFunc* self, const RF_String* str, int64_t str_count,
                    double score_cutoff, double score_hint, double* result);
        bool (*i64)(const struct _RF_ScorerFunc* self, const RF_String* str, int64_t str_count,
                    int64_t score_cutoff, int64_t score_hint, int64_t* result);
        bool (*sizet)(const struct _RF_ScorerFunc* self, const RF_String* str, int64_t str_count,
                      size_t score_cutoff, size_t score_hint, size_t* result);
    } call;

    /* members */
    void* context; /**< context of the scorer */
} RF_ScorerFunc;

/**
 * @brief struct describing a Scorer
 */
typedef struct _RF_UncachedScorerFunc {
    union {
        bool (*f64)(const RF_String* str1, const RF_String* str2, const RF_Kwargs* kwargs,
                    double score_cutoff, double score_hint, double* result);
        bool (*i64)(const RF_String* str1, const RF_String* str2, const RF_Kwargs* kwargs,
                    int64_t score_cutoff, int64_t score_hint, int64_t* result);
        bool (*sizet)(const RF_String* str1, const RF_String* str2, const RF_Kwargs* kwargs,
                      size_t score_cutoff, size_t score_hint, size_t* result);
    } call;
} RF_UncachedScorerFunc;

/**
 * @brief construct RF_ScorerFunc.
 *
 * @param[out] self constructed RF_ScorerFunc instance
 * @param[in] kwargs keyword arguments for additional parameters
 * @param[in] str_count size of the strings array can only be != 1 if
 *                      RF_SCORER_FLAG_MULTI_STRING is set
 * @param[in] strings array of strings to compare in distance function
 *
 * @return true on success and false with a Python exception set on failure
 */
typedef bool (*RF_ScorerFuncInit)(RF_ScorerFunc* self, const RF_Kwargs* kwargs, int64_t str_count,
                                  const RF_String* strings);

/* RF_ScorerFuncInit supports str_count != 1.
 * This is useful for scorers which have SIMD support
 */
#define RF_SCORER_FLAG_MULTI_STRING_INIT ((uint32_t)1 << 0)

/* RF_ScorerFunc::call can be called with str_count != 1
 * This is useful for scorers which have SIMD support
 */
#define RF_SCORER_FLAG_MULTI_STRING_CALL ((uint32_t)1 << 1)

/* scorer returns result as double */
#define RF_SCORER_FLAG_RESULT_F64 ((uint32_t)1 << 5)

/* scorer returns result as int64_t */
#define RF_SCORER_FLAG_RESULT_I64 ((uint32_t)1 << 6)

/* scorer returns result as size_t */
#define RF_SCORER_FLAG_RESULT_SIZE_T ((uint32_t)1 << 7)

/* scorer is symmetric: scorer(a, b) == scorer(b, a) */
#define RF_SCORER_FLAG_SYMMETRIC ((uint32_t)1 << 11)

/* scorer adheres to triangle inequality: scorer(a,b) <= scorer(a,c) + scorer(b,c)
 * Implies that the scorer is symmetric
 */
#define RF_SCORER_FLAG_TRIANGLE_INEQUALITY ((uint32_t)1 << 12 | RF_SCORER_FLAG_SYMMETRIC)

/* when none is passed this is the worst score */
#define RF_SCORER_NONE_IS_WORST_SCORE ((uint32_t)1 << 13)

/**
 * @brief information associated with a scorer
 */
typedef struct _RF_ScorerFlags {
    /**
     * @brief flags of the scorer
     */
    uint32_t flags;
    /**
     * @brief optimal score which can be achieved.
     */
    union {
        double f64;
        int64_t i64;
        size_t sizet;
    } optimal_score;

    /**
     * @brief worst score which can be achieved.
     */
    union {
        double f64;
        int64_t i64;
        size_t sizet;
    } worst_score;
} RF_ScorerFlags;

/**
 * @brief retrieve flags associated with the scorer
 *
 * @param[in] kwargs keyword arguments of the scorer
 * @param[out] scorer_flags Scorer Flags associated with the scorer
 *
 * @return true on success and false with a Python exception set on failure
 */
typedef bool (*RF_GetScorerFlags)(const RF_Kwargs* kwargs, RF_ScorerFlags* scorer_flags);

/**
 * @brief struct describing a Scorer callback function.
 */
typedef struct {
#define SCORER_STRUCT_VERSION ((uint32_t)3)
    uint32_t version;                   /**< version number of the structure. Set to SCORER_STRUCT_VERSION */
    RF_KwargsInit kwargs_init;          /**< keyword argument constructor */
    RF_GetScorerFlags get_scorer_flags; /**< function to retrieve additional information about the scorer */
    RF_ScorerFuncInit scorer_func_init; /**< scorer constructor */
    RF_UncachedScorerFunc uncached_scorer_func; /**< uncached scorer */
} RF_Scorer;

#ifdef __cplusplus
}
#endif

#endif /* RAPIDFUZZ_CAPI_H */