
Commit 3905b1d
added custom bawialniagpt model and removed bielik
DuckyBlender committed May 14, 2024
1 parent 730ec9f commit 3905b1d
Showing 5 changed files with 262 additions and 73 deletions.
1 change: 0 additions & 1 deletion Cargo.toml
@@ -23,7 +23,6 @@ enum-iterator = "2.1"
 ollama-rs = { version = "0.1.9", features = ["stream"] }
 tokio-stream = "0.1.15"
 image = "0.25.1"
-lazy_static = "1.4.0"
 aws-config = { version = "1.3", features = ["behavior-version-latest"] }
 aws-sdk-bedrockruntime = "1.24"
 # indicatif = "0.17.8"
21 changes: 1 addition & 20 deletions src/commands/ollama.rs
@@ -12,7 +12,6 @@ use teloxide::{
 use tokio_stream::StreamExt;
 
 use crate::models::ModelType;
-use crate::CURRENT_TASKS;
 
 pub const INTERVAL_SEC: u64 = 5;
 
@@ -95,25 +94,11 @@ pub async fn ollama(
 
     // Send a message to the chat to show that the bot is generating a response
     let generating_message = bot
-        .send_message(
-            msg.chat.id,
-            format!(
-                "Generating response...{}",
-                if CURRENT_TASKS.lock().await.len() >= 1 {
-                    format!(" (queue: {})", CURRENT_TASKS.lock().await.len())
-                } else {
-                    "".to_string()
-                }
-            ),
-        )
+        .send_message(msg.chat.id, "Generating response...".to_string())
         .reply_to_message_id(msg.id)
         .disable_notification(true)
         .await?;
 
-    let mut tasks = CURRENT_TASKS.lock().await;
-    tasks.push(generating_message.id);
-    drop(tasks);
-
     // Send typing indicator
     bot.send_chat_action(msg.chat.id, ChatAction::Typing)
         .await?;
@@ -217,10 +202,6 @@ pub async fn ollama(
     }
 
     info!("Final response received");
-    let mut tasks = CURRENT_TASKS.lock().await;
-    if let Some(index) = tasks.iter().position(|x| *x == generating_message.id) {
-        tasks.remove(index);
-    }
 
     if entire_response.is_empty() {
         warn!("No response received!");
221 changes: 221 additions & 0 deletions src/commands/summarize.rs
@@ -0,0 +1,221 @@
+// /summarize command - summarizes a youtube video or given text.
+
+use log::{error, info, warn};
+use ollama_rs::generation::completion::request::GenerationRequest;
+use ollama_rs::Ollama;
+use serde::Serialize;
+use teloxide::payloads::SendMessageSetters;
+use teloxide::{
+    requests::Requester,
+    types::{ChatAction, Message},
+    Bot, RequestError,
+};
+use tokio_stream::StreamExt;
+use youtube_transcript::{Transcript, Youtube, YoutubeBuilder};
+
+use crate::commands::ollama::INTERVAL_SEC;
+use crate::ModelType;
+
+pub async fn summarize(
+    bot: Bot,
+    msg: Message,
+    prompt: Option<String>,
+    ollama_client: Ollama,
+) -> Result<(), RequestError> {
+    // Check if the prompt is a youtube video or text
+    let prompt = match prompt {
+        Some(prompt) => prompt,
+        None => {
+            // If it's not in the prompt, check the reply
+            if let Some(reply) = msg.reply_to_message() {
+                if let Some(text) = reply.text() {
+                    text.to_string()
+                } else {
+                    let bot_msg = bot
+                        .send_message(msg.chat.id, "No prompt provided")
+                        .reply_to_message_id(msg.id)
+                        .await?;
+
+                    // Wait 5 seconds
+                    tokio::time::sleep(std::time::Duration::from_secs(5)).await;
+
+                    // Deleting the messages
+                    bot.delete_message(msg.chat.id, msg.id).await?;
+                    bot.delete_message(bot_msg.chat.id, bot_msg.id).await?;
+                    return Ok(());
+                }
+            } else {
+                let bot_msg = bot
+                    .send_message(msg.chat.id, "No prompt provided")
+                    .reply_to_message_id(msg.id)
+                    .await?;
+
+                // Wait 5 seconds
+                tokio::time::sleep(std::time::Duration::from_secs(5)).await;
+
+                // Deleting the messages
+                bot.delete_message(msg.chat.id, msg.id).await?;
+                bot.delete_message(bot_msg.chat.id, bot_msg.id).await?;
+                return Ok(());
+            }
+        }
+    };
+
+    // Check if the prompt is a youtube video or plain text; it can also be a shortened youtube link:
+    // https://www.youtube.com/watch?v=w0VMkE1toYg OR https://youtu.be/w0VMkE1toYg
+    let youtube_regex = regex::Regex::new(r"https://www\.youtube\.com/watch\?v=(?P<id>[a-zA-Z0-9_-]{11})|https://youtu\.be/(?P<id2>[a-zA-Z0-9_-]{11})").unwrap();
+
+    let is_youtube = youtube_regex.is_match(&prompt);
+    let generating_message = if is_youtube {
+        // If it's a youtube video, use the youtube-transcript library and the summarization model
+        bot.send_message(msg.chat.id, "Summarizing youtube video...")
+            .reply_to_message_id(msg.id)
+            .await?
+    } else {
+        // If it's text, use the summarization model
+        bot.send_message(msg.chat.id, "Summarizing text...")
+            .reply_to_message_id(msg.id)
+            .await?
+    };
+
+    info!("Starting summarization command");
+
+    // Send typing indicator
+    bot.send_chat_action(msg.chat.id, ChatAction::Typing)
+        .await?;
+
+    // Download the youtube video and get the transcript
+
+    let text = if is_youtube {
+        // Get the youtube video id
+        let link: &str = prompt.as_str();
+        let youtube_loader = YoutubeBuilder::default();
+        let youtube_loader = youtube_loader.build();
+        let transcript = youtube_loader.transcript(link).await;
+        if let Ok(transcript) = transcript {
+            let mut text = String::new();
+            for t in transcript.transcripts {
+                text.push_str(&t.text);
+            }
+
+            text
+        } else {
+            let bot_msg = bot
+                .send_message(msg.chat.id, "Error: Could not get the transcript")
+                .reply_to_message_id(msg.id)
+                .await?;
+
+            // Wait 5 seconds
+            tokio::time::sleep(std::time::Duration::from_secs(5)).await;
+
+            // Deleting the messages
+            bot.delete_message(msg.chat.id, msg.id).await?;
+            bot.delete_message(bot_msg.chat.id, bot_msg.id).await?;
+            return Ok(());
+        }
+    } else {
+        prompt.clone()
+    };
+
+    // Summarize the text using phi-3
+    let model = ModelType::Phi3;
+
+    // Send the stream request using ollama-rs
+    let before_request = std::time::Instant::now();
+    let request = GenerationRequest::new(model.to_string(), text)
+        .system("Summarize this text to the best of your abilities.".to_string());
+    let stream = ollama_client.generate_stream(request).await;
+
+    match stream {
+        Ok(_) => {
+            info!(
+                "Stream request for model {} successful, incoming token responses..",
+                model
+            );
+        }
+        Err(e) => {
+            error!("Stream request failed: {}", e);
+            bot.edit_message_text(
+                generating_message.chat.id,
+                generating_message.id,
+                format!("Failed to generate response: {}", e),
+            )
+            .await?;
+            return Ok(());
+        }
+    }
+
+    let mut stream = stream.unwrap(); // safe unwrap: the Err case returned above
+
+    // Track the time of the last edit so the message is only updated every few seconds
+    let mut now = std::time::Instant::now();
+
+    // Create a string to hold the entire response; " [...]" is appended while the bot is still receiving
+    let mut entire_response = String::new();
+    let mut current_message_content = String::new();
+
+    // Parse the response and edit the message every 5 seconds
+    'response_loop: while let Some(Ok(res)) = stream.next().await {
+        for ele in res {
+            // Append the new response to the entire response
+            entire_response.push_str(&ele.response);
+
+            // Check if 5 seconds have passed since the last edit
+            if now.elapsed().as_secs() >= INTERVAL_SEC {
+                // Skip the edit if the message content hasn't changed
+                if current_message_content == entire_response {
+                    continue;
+                }
+
+                // Update the current string
+                current_message_content.clone_from(&entire_response);
+
+                // Edit the message
+                bot.edit_message_text(
+                    generating_message.chat.id,
+                    generating_message.id,
+                    current_message_content.clone() + " [...]",
+                )
+                .await?;
+
+                // Send the typing indicator
+                bot.send_chat_action(msg.chat.id, ChatAction::Typing)
+                    .await?;
+
+                // Reset the timer
+                now = std::time::Instant::now();
+            }
+
+            // If the response is done, break the loop
+            if ele.done {
+                break 'response_loop;
+            }
+        }
+    }
+
+    info!("Final response received");
+
+    if entire_response.is_empty() {
+        warn!("No response received!");
+        entire_response = "<no response>".to_string();
+    }
+
+    // Edit the message one last time
+    bot.edit_message_text(
+        generating_message.chat.id,
+        generating_message.id,
+        entire_response.clone().trim_end(),
+    )
+    .await?;
+
+    let elapsed = before_request.elapsed().as_secs_f32();
+
+    info!(
+        "Generated ollama response.\n - Time elapsed: {:.2}s\n - Model: {}\n - Gen. Length: {}",
+        elapsed,
+        model,
+        entire_response.len()
+    );
+
+    Ok(())
+}
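The new command is presumably dispatched from the handler in main.rs the same way as the other commands; that registration sits outside the loaded hunks, but based on the pattern shown below for BawialniaGPT it would look roughly like this hypothetical sketch (the Commands::Summarize variant is assumed, not shown in this diff):

    // Hypothetical match arm in main.rs's handler; mirrors the other command arms.
    Ok(Commands::Summarize) => {
        tokio::spawn(summarize(
            bot.clone(),
            msg.clone(),
            get_prompt(trimmed_text, &msg),
            ollama_client,
        ));
    }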
42 changes: 16 additions & 26 deletions src/main.rs
@@ -2,26 +2,16 @@ use aws_config::BehaviorVersion;
 use log::info;
 
 use ollama_rs::Ollama;
-use teloxide::{
-    prelude::*,
-    types::{Me, MessageId},
-    utils::command::BotCommands,
-    RequestError,
-};
+use teloxide::{prelude::*, types::Me, utils::command::BotCommands, RequestError};
 mod models;
 
 use models::ModelType;
-use tokio::sync::Mutex;
 
 mod commands;
 use commands::*;
 
 use crate::models::setup_models;
 
-lazy_static::lazy_static! {
-    pub static ref CURRENT_TASKS: Mutex<Vec<MessageId>> = Mutex::new(vec![]);
-}
-
 #[tokio::main]
 async fn main() {
     dotenv::dotenv().ok();
@@ -104,17 +94,12 @@ enum Commands {
         hide
     )]
     ChatLGBT,
-    #[command(
-        description = "generate text using the pplx-7b-online model",
-        hide
-    )]
+    #[command(description = "generate text using the pplx-7b-online model", hide)]
     Online,
     #[command(description = "multimodal GPT-4-vision", alias = "gpt", hide)]
     GPT4,
     #[command(description = "DALLE 3", alias = "dalle", hide)]
     Dalle3,
-    #[command(description = "generate Polish text using the bielik model")]
-    Bielik,
     #[command(description = "generate text using 70B LLAMA 3 model", aliases = ["llama", "l"])]
     LLAMA3,
     #[command(
@@ -157,6 +142,11 @@ enum Commands {
     Claude3,
     #[command(description = "respond to an image using llava phi3", alias = "llava")]
     Vision,
+    #[command(
+        description = "custom bawialniaGPT model (nonsense model)",
+        alias = "bawialnia"
+    )]
+    BawialniaGPT,
 }
 
 // Handler function for bot events
@@ -175,6 +165,15 @@ async fn handler(
         .trim()
         .to_string();
     match BotCommands::parse(text, me.username()) {
+        Ok(Commands::BawialniaGPT) => {
+            tokio::spawn(ollama(
+                bot.clone(),
+                msg.clone(),
+                get_prompt(trimmed_text, &msg),
+                ModelType::BawialniaGPT,
+                ollama_client,
+            ));
+        }
         Ok(Commands::Claude3) => {
             tokio::spawn(bedrock(
                 bot.clone(),
@@ -392,15 +391,6 @@ async fn handler(
                 ModelType::LLAMA3,
             ));
         }
-        Ok(Commands::Bielik) => {
-            tokio::spawn(ollama(
-                bot.clone(),
-                msg.clone(),
-                get_prompt(trimmed_text, &msg),
-                ModelType::Bielik,
-                ollama_client,
-            ));
-        }
 
         Ok(Commands::Online) => {
             tokio::spawn(perplexity(
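Note: the fifth changed file's diff did not load on this page. Given the ModelType::BawialniaGPT and ModelType::Bielik references in main.rs, it is presumably src/models.rs, with a change along these lines (a hypothetical sketch, not the actual diff):

    // src/models.rs (assumed): swap the enum variant and its model-tag mapping.
    pub enum ModelType {
        // ...
        BawialniaGPT, // replaces Bielik; to_string() presumably yields the custom "bawialniagpt" Ollama tag
        // ...
    }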
