Mirror of https://gitlab.com/niansa/discord_llama.git
Commit 31885f6cd2 (parent 524d90e138): Implemented proper scrolling
4 changed files with 82 additions and 2 deletions
anyproc (submodule, 2 changes)
@@ -1 +1 @@
-Subproject commit 59e75326813a2c73b94340892de55a16d8ee8d9a
+Subproject commit e820c00e723e6eac2a935ad7b5b91cee9446eb9d
@@ -21,3 +21,4 @@ pool_size 2
 threads 4
 timeout 120
 ctx_size 1012
+scroll_keep 20
explained_config.txt (new file, 54 lines)
@@ -0,0 +1,54 @@
+token MTA0MDYxMTQzNjUwNzk1OTMyNw.Gl_iMU.jVVM3bRqBJVi8ORVpWHquOivlASGJpRySt8qFg
+
+# The following parameters are set to their defaults here and can be omitted
+
+# Directory the models are located in. For example, see example_models/
+models_dir models
+
+# Language everything is translated to (translation is disabled if set to "EN")
+language EN
+
+# Whether the bot should respond to pings outside threads
+threads_only true
+
+# Whether the bot should update messages periodically while writing them. Incompatible with translation
+live_edit false
+
+# Model to use outside threads
+default_inference_model 13b-vanilla
+
+# Model to be used for translation
+translation_model none
+
+# Few-shot prompt for non-instruct-mode. See example_prompt.txt
+prompt_file none
+
+# Prompt for instruct-mode. See example_instruct_prompt.txt
+instruct_prompt_file none
+
+# Number of shards ("instances") of this bot. This is NOT Discord sharding
+shard_count 1
+
+# Number of this shard. Must be unique in the entire bot
+shard_id 0
+
+# Whether contexts ("chat histories") should persist across restarts
+persistance true
+
+# Whether swapping should be prevented using mlock
+mlock false
+
+# Number of contexts to keep in RAM at a time
+pool_size 2
+
+# Number of CPU threads to use
+threads 4
+
+# Response/Evaluation timeout in seconds
+timeout 120
+
+# Max. context size
+ctx_size 1012
+
+# Percentage of the context below the prompt to be kept when scrolling. 0 means no context will be kept when scrolling.
+scroll_keep 20
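For intuition on the new scroll_keep setting: it is a whole-number percentage that the bot later converts to a fraction (see the main.cpp hunk below that multiplies by 0.01f). A minimal standalone sketch of the arithmetic, using ctx_size 1012 and scroll_keep 20 from the example above (variable names here are illustrative, not the repo's):

#include <cstdio>

int main() {
    int ctx_size = 1012;    // "Max. context size" from the config
    int scroll_keep = 20;   // percentage of context kept below the prompt
    float fraction = float(scroll_keep) * 0.01f;   // same conversion as in main.cpp
    // Rough number of tokens below the prompt that survive one scroll:
    std::printf("keeping ~%d of %d tokens\n", int(ctx_size * fraction), ctx_size);
}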
main.cpp (27 changes)
@@ -108,6 +108,7 @@ public:
     pool_size = 2,
     timeout = 120,
     threads = 4,
+    scroll_keep = 20,
     shard_cout = 1,
     shard_id = 0;
     bool persistance = true,
@@ -205,7 +206,9 @@ private:
         if (channel_cfg.instruct_mode && config.instruct_prompt_file == "none") return;
         std::ifstream f((*channel_cfg.model_name)+(channel_cfg.instruct_mode?"_instruct_init_cache":"_init_cache"), std::ios::binary);
         inference.deserialize(f);
+        // Set params
         inference.params.n_ctx_window_top_bar = inference.get_context_size();
+        inference.params.scroll_keep = float(config.scroll_keep) * 0.01f;
     }
     // Must run in llama thread
     LM::Inference &llm_start(dpp::snowflake id, const BotChannelConfig& channel_cfg) {
@@ -219,12 +222,20 @@ private:
     // Must run in llama thread
     LM::Inference &llm_get_inference(dpp::snowflake id, const BotChannelConfig& channel_cfg) {
         ENSURE_LLM_THREAD();
+        // Get inference
         auto inference_opt = llm_pool.get_inference(id);
         if (!inference_opt.has_value()) {
             // Start new inference
             inference_opt = llm_start(id, channel_cfg);
         }
-        return inference_opt.value();
+        auto& fres = inference_opt.value();
+        // Set scroll callback
+        fres.get().set_scroll_callback([msg = dpp::message(), channel_id = id] (float progress) {
+            std::cout << "WARNING: " << channel_id << " is scrolling! " << progress << "% \r" << std::flush;
+            return true;
+        });
+        // Return inference
+        return fres;
     }

     // Must run in llama thread
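The lambda registered above is the scroll-callback contract this commit introduces: the library reports a progress value, and the callback's boolean return decides whether generation continues. A standalone sketch of that contract; ScrollDemo is a stand-in written for illustration, not the real LM::Inference API:

#include <functional>
#include <iostream>

struct ScrollDemo {
    std::function<bool(float)> on_scroll;
    void set_scroll_callback(std::function<bool(float)> cb) { on_scroll = std::move(cb); }
    // Simulates the library asking what to do when the context overflows:
    bool scroll(float progress) { return on_scroll ? on_scroll(progress) : true; }
};

int main() {
    ScrollDemo demo;
    demo.set_scroll_callback([] (float progress) {
        std::cout << "scrolling: " << progress << "%\n";
        return true;  // keep generating; returning false stops, as the cache-build path below does
    });
    demo.scroll(12.5f);
}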
@@ -239,6 +250,12 @@ private:
             texts.timeout = llm_translate_from_en(texts.timeout);
             texts.translated = true;
         }
+        // Set scroll callback
+        auto scroll_cb = [] (float) {
+            std::cerr << "Error: Prompt doesn't fit into max. context size!" << std::endl;
+            abort();
+            return false;
+        };
         // Build init caches
         std::string filename;
         for (const auto& [model_name, model_config] : model_configs) {
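Note the asymmetry between the two callbacks this commit installs: in live chat (llm_get_inference above) the callback logs a warning and returns true, so the conversation scrolls and generation continues, while the scroll_cb used for init-cache building returns false and aborts, since a base prompt that does not fit into the maximum context size is a configuration error rather than something to scroll past.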
@@ -266,6 +283,7 @@ private:
             // Append
             using namespace fmt::literals;
             if (prompt.back() != '\n') prompt.push_back('\n');
+            llm->set_scroll_callback(scroll_cb);
             llm->append(fmt::format(fmt::runtime(prompt), "bot_name"_a=bot.me.username), show_console_progress);
             // Serialize end result
             std::ofstream f(filename, std::ios::binary);
@@ -294,6 +312,7 @@ private:
             // Append
             using namespace fmt::literals;
             if (prompt.back() != '\n') prompt.push_back('\n');
+            llm->set_scroll_callback(scroll_cb);
             llm->append(fmt::format(fmt::runtime(prompt), "bot_name"_a=bot.me.username)+"\n\n"+model_config.user_prompt, show_console_progress);
             // Serialize end result
             std::ofstream f(filename, std::ios::binary);
@@ -671,6 +690,8 @@ int main(int argc, char **argv) {
         cfg.pool_size = std::stoi(value);
     } else if (key == "threads") {
         cfg.threads = std::stoi(value);
+    } else if (key == "scroll_keep") {
+        cfg.scroll_keep = std::stoi(value);
     } else if (key == "shard_cout") {
         cfg.shard_cout = std::stoi(value);
     } else if (key == "shard_id") {
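The scroll_keep branch slots into main.cpp's existing key/value config parser. The parser's surrounding code is not shown in this diff; a self-contained sketch of the general pattern it implies (one key, whitespace, then the value per line):

#include <iostream>
#include <sstream>
#include <string>

int main() {
    std::string line = "scroll_keep 20";     // one line of the config file
    std::istringstream ls(line);
    std::string key, value;
    ls >> key;                               // first token is the key
    std::getline(ls >> std::ws, value);      // remainder of the line is the value
    if (key == "scroll_keep") {
        int scroll_keep = std::stoi(value);  // same conversion as cfg.scroll_keep = std::stoi(value)
        std::cout << "scroll_keep = " << scroll_keep << '\n';
    }
}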
@@ -789,6 +810,10 @@ int main(int argc, char **argv) {
             exit(-7);
         }
     }
+    if (cfg.scroll_keep >= 99) {
+        std::cerr << "Error: scroll_keep must be an integer percentage in the range of 0-98." << std::endl;
+        exit(-12);
+    }

     // Construct and configure bot
     Bot bot(cfg, models);
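Since the guard rejects anything at or above 99, the accepted range is effectively 0-98; the default of 20 (and any omitted scroll_keep) passes the check.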