summaryrefslogtreecommitdiff
path: root/deps/theft/theft.c
diff options
context:
space:
mode:
Diffstat (limited to 'deps/theft/theft.c')
-rw-r--r--deps/theft/theft.c496
1 files changed, 496 insertions, 0 deletions
diff --git a/deps/theft/theft.c b/deps/theft/theft.c
new file mode 100644
index 0000000..7c6244f
--- /dev/null
+++ b/deps/theft/theft.c
@@ -0,0 +1,496 @@
+#include <string.h>
+
+#include "theft.h"
+#include "theft_types_internal.h"
+#include "theft_bloom.h"
+#include "theft_mt.h"
+
+/* Initialize a theft test runner.
+ * BLOOM_BITS sets the size of the table used for detecting
+ * combinations of arguments that have already been tested.
+ * If 0, a default size will be chosen based on trial count.
+ * (This will only be used if all property types have hash
+ * callbacks defined.) The bloom filter can also be disabled
+ * by setting BLOOM_BITS to THEFT_BLOOM_DISABLE.
+ *
+ * Returns a NULL if malloc fails or BLOOM_BITS is out of bounds. */
+struct theft *theft_init(uint8_t bloom_bits) {
+ if ((bloom_bits != 0 && (bloom_bits < THEFT_BLOOM_BITS_MIN))
+ || ((bloom_bits > THEFT_BLOOM_BITS_MAX) &&
+ bloom_bits != THEFT_BLOOM_DISABLE)) {
+ return NULL;
+ }
+
+ theft *t = malloc(sizeof(*t));
+ if (t == NULL) { return NULL; }
+ memset(t, 0, sizeof(*t));
+
+ t->mt = theft_mt_init(DEFAULT_THEFT_SEED);
+ if (t->mt == NULL) {
+ free(t);
+ return NULL;
+ } else {
+ t->out = stdout;
+ t->requested_bloom_bits = bloom_bits;
+ return t;
+ }
+}
+
+/* (Re-)initialize the random number generator with a specific seed. */
+void theft_set_seed(struct theft *t, uint64_t seed) {
+ t->seed = seed;
+ theft_mt_reset(t->mt, seed);
+}
+
+/* Get a random 64-bit integer from the test runner's PRNG. */
+theft_seed theft_random(struct theft *t) {
+ theft_seed ns = (theft_seed)theft_mt_random(t->mt);
+ return ns;
+}
+
+/* Get a random double from the test runner's PRNG. */
+double theft_random_double(struct theft *t) {
+ return theft_mt_random_double(t->mt);
+}
+
+/* Change T's output stream handle to OUT. (Default: stdout.) */
+void theft_set_output_stream(struct theft *t, FILE *out) { t->out = out; }
+
+/* Check if all argument info structs have all required callbacks. */
+static bool
+check_all_args(struct theft_propfun_info *info, bool *all_hashable) {
+ bool ah = true;
+ for (int i = 0; i < info->arity; i++) {
+ struct theft_type_info *ti = info->type_info[i];
+ if (ti->alloc == NULL) { return false; }
+ if (ti->hash == NULL) { ah = false; }
+ }
+ *all_hashable = ah;
+ return true;
+}
+
+static theft_progress_callback_res
+default_progress_cb(struct theft_trial_info *info, void *env) {
+ (void)info;
+ (void)env;
+ return THEFT_PROGRESS_CONTINUE;
+}
+
+static void infer_arity(struct theft_propfun_info *info) {
+ for (int i = 0; i < THEFT_MAX_ARITY; i++) {
+ if (info->type_info[i] == NULL) {
+ info->arity = i;
+ break;
+ }
+ }
+}
+
+/* Run a series of randomized trials of a property function.
+ *
+ * Configuration is specified in CFG; many fields are optional.
+ * See the type definition in `theft_types.h`. */
+theft_run_res
+theft_run(struct theft *t, struct theft_cfg *cfg) {
+ if (t == NULL || cfg == NULL) {
+ return THEFT_RUN_ERROR_BAD_ARGS;
+ }
+
+ struct theft_propfun_info info;
+ memset(&info, 0, sizeof(info));
+ info.name = cfg->name;
+ info.fun = cfg->fun;
+ memcpy(info.type_info, cfg->type_info, sizeof(info.type_info));
+ info.always_seed_count = cfg->always_seed_count;
+ info.always_seeds = cfg->always_seeds;
+
+ if (cfg->seed) {
+ theft_set_seed(t, cfg->seed);
+ } else {
+ theft_set_seed(t, DEFAULT_THEFT_SEED);
+ }
+
+ if (cfg->trials == 0) { cfg->trials = THEFT_DEF_TRIALS; }
+
+ return theft_run_internal(t, &info, cfg->trials, cfg->progress_cb,
+ cfg->env, cfg->report);
+}
+
+/* Actually run the trials, with all arguments made explicit. */
+static theft_run_res
+theft_run_internal(struct theft *t, struct theft_propfun_info *info,
+ int trials, theft_progress_cb *cb, void *env,
+ struct theft_trial_report *r) {
+
+ struct theft_trial_report fake_report;
+ if (r == NULL) { r = &fake_report; }
+ memset(r, 0, sizeof(*r));
+
+ infer_arity(info);
+ if (info->arity == 0) {
+ return THEFT_RUN_ERROR_BAD_ARGS;
+ }
+
+ if (t == NULL || info == NULL || info->fun == NULL
+ || info->arity == 0) {
+ return THEFT_RUN_ERROR_BAD_ARGS;
+ }
+
+ bool all_hashable = false;
+ if (!check_all_args(info, &all_hashable)) {
+ return THEFT_RUN_ERROR_MISSING_CALLBACK;
+ }
+
+ if (cb == NULL) { cb = default_progress_cb; }
+
+ /* If all arguments are hashable, then attempt to use
+ * a bloom filter to avoid redundant checking. */
+ if (all_hashable) {
+ if (t->requested_bloom_bits == 0) {
+ t->requested_bloom_bits = theft_bloom_recommendation(trials);
+ }
+ if (t->requested_bloom_bits != THEFT_BLOOM_DISABLE) {
+ t->bloom = theft_bloom_init(t->requested_bloom_bits);
+ }
+ }
+
+ theft_seed seed = t->seed;
+ theft_seed initial_seed = t->seed;
+ int always_seeds = info->always_seed_count;
+ if (info->always_seeds == NULL) { always_seeds = 0; }
+
+ void *args[THEFT_MAX_ARITY];
+
+ theft_progress_callback_res cres = THEFT_PROGRESS_CONTINUE;
+
+ for (int trial = 0; trial < trials; trial++) {
+ memset(args, 0xFF, sizeof(args));
+ if (cres == THEFT_PROGRESS_HALT) { break; }
+
+ /* If any seeds to always run were specified, use those before
+ * reverting to the specified starting seed. */
+ if (trial < always_seeds) {
+ seed = info->always_seeds[trial];
+ } else if ((always_seeds > 0) && (trial == always_seeds)) {
+ seed = initial_seed;
+ }
+
+ struct theft_trial_info ti = {
+ .name = info->name,
+ .trial = trial,
+ .seed = seed,
+ .arity = info->arity,
+ .args = args
+ };
+
+ theft_set_seed(t, seed);
+ all_gen_res_t gres = gen_all_args(t, info, seed, args, env);
+ switch (gres) {
+ case ALL_GEN_SKIP:
+ /* skip generating these args */
+ ti.status = THEFT_TRIAL_SKIP;
+ r->skip++;
+ cres = cb(&ti, env);
+ break;
+ case ALL_GEN_DUP:
+ /* skip these args -- probably already tried */
+ ti.status = THEFT_TRIAL_DUP;
+ r->dup++;
+ cres = cb(&ti, env);
+ break;
+ default:
+ case ALL_GEN_ERROR:
+ /* Error while generating args */
+ ti.status = THEFT_TRIAL_ERROR;
+ cres = cb(&ti, env);
+ return THEFT_RUN_ERROR;
+ case ALL_GEN_OK:
+ /* (Extracted function to avoid deep nesting here.) */
+ if (!run_trial(t, info, args, cb, env, r, &ti, &cres)) {
+ return THEFT_RUN_ERROR;
+ }
+ }
+
+ free_args(info, args, env);
+
+ /* Restore last known seed and generate next. */
+ theft_set_seed(t, seed);
+ seed = theft_random(t);
+ }
+
+ if (r->fail > 0) {
+ return THEFT_RUN_FAIL;
+ } else {
+ return THEFT_RUN_PASS;
+ }
+}
+
+/* Now that arguments have been generated, run the trial and update
+ * counters, call cb with results, etc. */
+static bool run_trial(struct theft *t, struct theft_propfun_info *info,
+ void **args, theft_progress_cb *cb, void *env,
+ struct theft_trial_report *r, struct theft_trial_info *ti,
+ theft_progress_callback_res *cres) {
+ if (t->bloom) { mark_called(t, info, args, env); }
+ theft_trial_res tres = call_fun(info, args);
+ ti->status = tres;
+ switch (tres) {
+ case THEFT_TRIAL_PASS:
+ r->pass++;
+ *cres = cb(ti, env);
+ break;
+ case THEFT_TRIAL_FAIL:
+ if (!attempt_to_shrink(t, info, args, env)) {
+ ti->status = THEFT_TRIAL_ERROR;
+ *cres = cb(ti, env);
+ return false;
+ }
+ r->fail++;
+ *cres = report_on_failure(t, info, ti, cb, env);
+ break;
+ case THEFT_TRIAL_SKIP:
+ *cres = cb(ti, env);
+ r->skip++;
+ break;
+ case THEFT_TRIAL_DUP:
+ /* user callback should not return this; fall through */
+ case THEFT_TRIAL_ERROR:
+ *cres = cb(ti, env);
+ free_args(info, args, env);
+ return false;
+ }
+ return true;
+}
+
+static void free_args(struct theft_propfun_info *info,
+ void **args, void *env) {
+ for (int i = 0; i < info->arity; i++) {
+ theft_free_cb *fcb = info->type_info[i]->free;
+ if (fcb && args[i] != THEFT_SKIP) {
+ fcb(args[i], env);
+ }
+ }
+}
+
+void theft_free(struct theft *t) {
+ if (t->bloom) {
+ theft_bloom_dump(t->bloom);
+ theft_bloom_free(t->bloom);
+ t->bloom = NULL;
+ }
+ theft_mt_free(t->mt);
+ free(t);
+}
+
+/* Actually call the property function. Its number of arguments is not
+ * constrained by the typedef, but will be defined at the call site
+ * here. (If info->arity is wrong, it will probably crash.) */
+static theft_trial_res
+call_fun(struct theft_propfun_info *info, void **args) {
+ theft_trial_res res = THEFT_TRIAL_ERROR;
+ switch (info->arity) {
+ case 1:
+ res = info->fun(args[0]);
+ break;
+ case 2:
+ res = info->fun(args[0], args[1]);
+ break;
+ case 3:
+ res = info->fun(args[0], args[1], args[2]);
+ break;
+ case 4:
+ res = info->fun(args[0], args[1], args[2], args[3]);
+ break;
+ case 5:
+ res = info->fun(args[0], args[1], args[2], args[3], args[4]);
+ break;
+ case 6:
+ res = info->fun(args[0], args[1], args[2], args[3], args[4],
+ args[5]);
+ break;
+ case 7:
+ res = info->fun(args[0], args[1], args[2], args[3], args[4],
+ args[5], args[6]);
+ break;
+ case 8:
+ res = info->fun(args[0], args[1], args[2], args[3], args[4],
+ args[5], args[6], args[7]);
+ break;
+ case 9:
+ res = info->fun(args[0], args[1], args[2], args[3], args[4],
+ args[5], args[6], args[7], args[8]);
+ break;
+ case 10:
+ res = info->fun(args[0], args[1], args[2], args[3], args[4],
+ args[5], args[6], args[7], args[8], args[9]);
+ break;
+ /* ... */
+ default:
+ return THEFT_TRIAL_ERROR;
+ }
+ return res;
+}
+
+/* Attempt to instantiate arguments, starting with the current seed. */
+static all_gen_res_t
+gen_all_args(theft *t, struct theft_propfun_info *info,
+ theft_seed seed, void *args[THEFT_MAX_ARITY], void *env) {
+ for (int i = 0; i < info->arity; i++) {
+ struct theft_type_info *ti = info->type_info[i];
+ void *p = ti->alloc(t, seed, env);
+ if (p == THEFT_SKIP || p == THEFT_ERROR) {
+ for (int j = 0; j < i; j++) {
+ ti->free(args[j], env);
+ }
+ if (p == THEFT_SKIP) {
+ return ALL_GEN_SKIP;
+ } else {
+ return ALL_GEN_ERROR;
+ }
+ } else {
+ args[i] = p;
+ }
+ seed = theft_random(t);
+ }
+
+ /* check bloom filter */
+ if (t->bloom && check_called(t, info, args, env)) {
+ return ALL_GEN_DUP;
+ }
+
+ return ALL_GEN_OK;
+}
+
+/* Attempt to simplify all arguments, breadth first. Continue as long as
+ * progress is made, i.e., until a local minima is reached. */
+static bool
+attempt_to_shrink(theft *t, struct theft_propfun_info *info,
+ void *args[], void *env) {
+ bool progress = false;
+ do {
+ progress = false;
+ for (int ai = 0; ai < info->arity; ai++) {
+ struct theft_type_info *ti = info->type_info[ai];
+ if (ti->shrink) {
+ /* attempt to simplify this argument by one step */
+ shrink_res rres = attempt_to_shrink_arg(t, info, args, env, ai);
+ switch (rres) {
+ case SHRINK_OK:
+ progress = true;
+ break;
+ case SHRINK_DEAD_END:
+ break;
+ default:
+ case SHRINK_ERROR:
+ return false;
+ }
+ }
+ }
+ } while (progress);
+
+ return true;
+}
+
+/* Simplify an argument by trying all of its simplification tactics, in
+ * order, and checking whether the property still fails. If it passes,
+ * then revert the simplification and try another tactic.
+ *
+ * If the bloom filter is being used (i.e., if all arguments have hash
+ * callbacks defined), then use it to skip over areas of the state
+ * space that have probably already been tried. */
+static shrink_res
+attempt_to_shrink_arg(theft *t, struct theft_propfun_info *info,
+ void *args[], void *env, int ai) {
+ struct theft_type_info *ti = info->type_info[ai];
+
+ for (uint32_t tactic = 0; tactic < THEFT_MAX_TACTICS; tactic++) {
+ void *cur = args[ai];
+ void *nv = ti->shrink(cur, tactic, env);
+ if (nv == THEFT_NO_MORE_TACTICS) {
+ return SHRINK_DEAD_END;
+ } else if (nv == THEFT_ERROR) {
+ return SHRINK_ERROR;
+ } else if (nv == THEFT_DEAD_END) {
+ continue; /* try next tactic */
+ }
+
+ args[ai] = nv;
+ if (t->bloom) {
+ if (check_called(t, info, args, env)) {
+ /* probably redundant */
+ if (ti->free) { ti->free(nv, env); }
+ args[ai] = cur;
+ continue;
+ } else {
+ mark_called(t, info, args, env);
+ }
+ }
+ theft_trial_res res = call_fun(info, args);
+
+ switch (res) {
+ case THEFT_TRIAL_PASS:
+ case THEFT_TRIAL_SKIP:
+ /* revert */
+ args[ai] = cur;
+ if (ti->free) { ti->free(nv, env); }
+ break;
+ case THEFT_TRIAL_FAIL:
+ if (ti->free) { ti->free(cur, env); }
+ return SHRINK_OK;
+ case THEFT_TRIAL_DUP: /* user callback should not return this */
+ case THEFT_TRIAL_ERROR:
+ return SHRINK_ERROR;
+ }
+ }
+ (void)t;
+ return SHRINK_DEAD_END;
+}
+
+/* Populate a buffer with hashes of all the arguments. */
+static void get_arg_hash_buffer(theft_hash *buffer,
+ struct theft_propfun_info *info, void **args, void *env) {
+ for (int i = 0; i < info->arity; i++) {
+ buffer[i] = info->type_info[i]->hash(args[i], env);
+ }
+}
+
+/* Mark the tuple of argument instances as called in the bloom filter. */
+static void mark_called(theft *t, struct theft_propfun_info *info,
+ void **args, void *env) {
+ theft_hash buffer[THEFT_MAX_ARITY];
+ get_arg_hash_buffer(buffer, info, args, env);
+ theft_bloom_mark(t->bloom, (uint8_t *)buffer,
+ info->arity * sizeof(theft_hash));
+}
+
+/* Check if this combination of argument instances has been called. */
+static bool check_called(theft *t, struct theft_propfun_info *info,
+ void **args, void *env) {
+ theft_hash buffer[THEFT_MAX_ARITY];
+ get_arg_hash_buffer(buffer, info, args, env);
+ return theft_bloom_check(t->bloom, (uint8_t *)buffer,
+ info->arity * sizeof(theft_hash));
+}
+
+/* Print info about a failure. */
+static theft_progress_callback_res report_on_failure(theft *t,
+ struct theft_propfun_info *info,
+ struct theft_trial_info *ti, theft_progress_cb *cb, void *env) {
+ static theft_progress_callback_res cres;
+
+ int arity = info->arity;
+ fprintf(t->out, "\n\n -- Counter-Example: %s\n",
+ info->name ? info-> name : "");
+ fprintf(t->out, " Trial %u, Seed 0x%016llx\n", ti->trial,
+ (uint64_t)ti->seed);
+ for (int i = 0; i < arity; i++) {
+ theft_print_cb *print = info->type_info[i]->print;
+ if (print) {
+ fprintf(t->out, " Argument %d:\n", i);
+ print(t->out, ti->args[i], env);
+ fprintf(t->out, "\n");
+ }
+ }
+
+ cres = cb(ti, env);
+ return cres;
+}