/*
 * Public interface for running inference with a per-token callback.
 *
 * token_callback
 *   Pointer to a function that receives one `const char *token` and returns
 *   bool. The typedef is declared inside an extern "C" block, so the
 *   function-pointer type has C language linkage.
 *   NOTE(review): presumably the bool return tells the caller whether to keep
 *   generating -- confirm against the implementation.
 *   NOTE(review): the lifetime/ownership of `token` is not stated here --
 *   confirm whether the callback must copy it before returning.
 *
 * run_inference
 *   Declared outside the extern "C" block. Takes a `gpt_params` by value and
 *   a `token_callback`, and returns an int.
 *   NOTE(review): `gpt_params` is not declared in this file; presumably it
 *   comes from one of the included headers -- confirm.
 *   NOTE(review): the meaning of the int return value (status code?) is not
 *   visible from this declaration -- confirm against the definition.
 *
 * NOTE(review): in this view the three #include directives carry no targets
 * and every declaration shares a line with `#pragma once`; verify the include
 * list and line breaks against the canonical copy of this header.
 */
#pragma once #include #include #include extern "C" { typedef bool (*token_callback)(const char *token); } int run_inference(gpt_params params, token_callback on_token);