Skip to content

Commit 81ce118

Browse files
committed
Various optimizations
1 parent cf57542 commit 81ce118

6 files changed

Lines changed: 582 additions & 160 deletions

File tree

Lines changed: 104 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,104 @@
1+
# model_params.py
2+
import openai
3+
import deepseek
4+
import logging
5+
from config import OPENAI_API_KEY
6+
from config import DEEPSEEK_API_KEY
7+
from config import XAI_API_KEY
8+
from config import ANTHROPIC_API_KEY
9+
from config import MODEL_TO_USE # Import the model selection
10+
import tiktoken
11+
import math
12+
import asyncio
13+
14+
# Set up OpenAI
15+
# openai.api_key = OPENAI_API_KEY
16+
17+
logger = logging.getLogger(__name__)
18+
19+
def get_model_params(model=MODEL_TO_USE):
    """
    Return the per-provider parameters for the selected chat model.

    The provider is chosen by substring match on the model name:
    'gpt' -> OpenAI, 'deepseek' -> DeepSeek, 'grok' -> xAI,
    'claude' -> Anthropic. Anything else falls back to DeepSeek.

    Args:
        model (str | None): The model identifier from config. May be
            None/empty; falsy values fall back to DeepSeek defaults.

    Returns:
        dict: Parameters in this exact key order (callers unpack via
            ``.values()``): 'tokens_per_chunk', 'max_chunks_allowed',
            'max_tokens', 'model', 'client' (an OpenAI-compatible client
            bound to the provider's base URL).
    """
    # Normalize once and guard against None/empty so .lower() cannot
    # raise AttributeError (the original crashed on model=None).
    selected = (model or "").lower()

    def _params(tokens_per_chunk, max_chunks_allowed, model_name, api_key, base_url):
        # One helper for all providers: every backend here exposes an
        # OpenAI-compatible API, so a single client type suffices.
        # Key insertion order is part of the contract (see docstring).
        return {
            "tokens_per_chunk": tokens_per_chunk,
            "max_chunks_allowed": max_chunks_allowed,
            "max_tokens": 1024,
            "model": model_name,
            "client": openai.OpenAI(api_key=api_key, base_url=base_url),
        }

    if "gpt" in selected:
        logger.info(f"Using OpenAI {model} model.")
        return _params(100000, 4, model or "gpt-4o-mini",
                       OPENAI_API_KEY, "https://api.openai.com/v1")
    elif "deepseek" in selected:
        logger.info(f"Using DeepSeek {model}.")
        return _params(64000, 5, model or "deepseek-chat",
                       DEEPSEEK_API_KEY, "https://api.deepseek.com")
    elif "grok" in selected:
        logger.info(f"Using xAI Grok {model}.")
        return _params(100000, 5, model or "grok-3-mini",
                       XAI_API_KEY, "https://api.x.ai/v1")
    elif "claude" in selected:
        logger.info(f"Using Anthropic's Claude {model}.")
        return _params(180000, 3, model or "claude-3-haiku-20240307",
                       ANTHROPIC_API_KEY, "https://api.anthropic.com/v1/")
    else:
        # Message now lists every supported provider (the original only
        # mentioned gpt/deepseek despite also supporting grok/claude).
        logger.error("Invalid model selection in config. Please select 'gpt' for OpenAI, 'deepseek' for DeepSeek, 'grok' for xAI or 'claude' for Anthropic.")
        logger.warning("Falling back to DeepSeek model as default.")
        # BUG FIX: the original returned `model or "deepseek-chat"` here,
        # which forwarded the *invalid* model name to the API whenever it
        # was a non-empty string. The fallback must actually use the
        # DeepSeek default model.
        return _params(64000, 5, "deepseek-chat",
                       DEEPSEEK_API_KEY, "https://api.deepseek.com")
75+
76+
77+
# if MODEL_TO_USE:
78+
# if "gpt" in MODEL_TO_USE.lower():
79+
# model_to_use = 1 # OpenAI model
80+
# elif "deepseek" in MODEL_TO_USE.lower():
81+
# model_to_use = 2
82+
# else:
83+
# logger.error("Invalid model selection in config. Please select 'gpt' for OpenAI or 'deepseek' for DeepSeek.")
84+
# logger.warning("Falling back to DeepSeek model as default.")
85+
# model_to_use = 2 # 1 for OpenAI, 2 for DeepSeek
86+
# raise ValueError("Invalid model selection in config. Please select 'gpt' for OpenAI or 'deepseek' for DeepSeek.")
87+
88+
# if model_to_use == 1:
89+
# tokens_per_chunk = 100000
90+
# max_chunks_allowed = 4
91+
# max_tokens = 1024
92+
# model = "gpt-4o-mini"
93+
# client = openai.OpenAI(api_key=OPENAI_API_KEY, base_url="https://api.openai.com/v1")
94+
# logger.info(f"Using OpenAI {model} model for summarization.")
95+
# elif model_to_use == 2:
96+
# tokens_per_chunk = 64000
97+
# max_chunks_allowed = 5
98+
# max_tokens = 1024
99+
# model = "deepseek-chat"
100+
# # for DeepSeek backward compatibility, you can still use `https://api.deepseek.com/v1` as `base_url`.
101+
# client = openai.OpenAI(api_key=DEEPSEEK_API_KEY, base_url="https://api.deepseek.com")
102+
# logger.info(f"Using DeepSeek {model} for summarization.")
103+
# else:
104+
# logger.error("Invalid model selection. Please select 1 for OpenAI or 2 for DeepSeek.")

youtubevideotranscriptbot/requirements.txt

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6,4 +6,5 @@ mysql-connector-python==8.1.0
66
isodate==0.6.1
77
openai==1.65.1 # 0.28.0 # Add this line
88
tiktoken==0.9.0
9-
deepseek==1.0.0
9+
deepseek==1.0.0
10+
aiofiles>=0.4.0

youtubevideotranscriptbot/summarize.py

Lines changed: 58 additions & 43 deletions
Original file line numberDiff line numberDiff line change
@@ -3,11 +3,12 @@
33
import deepseek
44
import logging
55
from translate import translate_text # Import the translation function
6+
from translate import split_text
7+
from model_params import get_model_params
68
from config import OPENAI_API_KEY
79
from config import DEEPSEEK_API_KEY
810
from config import MODEL_TO_USE # Import the model selection
911
import tiktoken
10-
from translate import split_text
1112
import math
1213
import asyncio
1314

@@ -16,34 +17,35 @@
1617

1718
logger = logging.getLogger(__name__)
1819

19-
if MODEL_TO_USE:
20-
if "gpt" in MODEL_TO_USE.lower():
21-
model_to_use = 1 # OpenAI model
22-
elif "deepseek" in MODEL_TO_USE.lower():
23-
model_to_use = 2
24-
else:
25-
logger.error("Invalid model selection in config. Please select 'gpt' for OpenAI or 'deepseek' for DeepSeek.")
26-
logger.warning("Falling back to DeepSeek model as default.")
27-
model_to_use = 2 # 1 for OpenAI, 2 for DeepSeek
28-
raise ValueError("Invalid model selection in config. Please select 'gpt' for OpenAI or 'deepseek' for DeepSeek.")
29-
30-
if model_to_use == 1:
31-
tokens_per_chunk = 100000
32-
max_chunks_allowed = 4
33-
max_tokens = 1024
34-
model = "gpt-4o-mini"
35-
client = openai.OpenAI(api_key=OPENAI_API_KEY, base_url="https://api.openai.com/v1")
36-
logger.info(f"Using OpenAI {model} model for summarization.")
37-
elif model_to_use == 2:
38-
tokens_per_chunk = 64000
39-
max_chunks_allowed = 3
40-
max_tokens = 1024
41-
model = "deepseek-chat"
42-
# for DeepSeek backward compatibility, you can still use `https://api.deepseek.com/v1` as `base_url`.
43-
client = openai.OpenAI(api_key=DEEPSEEK_API_KEY, base_url="https://api.deepseek.com")
44-
logger.info(f"Using DeepSeek {model} for summarization.")
45-
else:
46-
logger.error("Invalid model selection. Please select 1 for OpenAI or 2 for DeepSeek.")
20+
21+
# if MODEL_TO_USE:
22+
# if "gpt" in MODEL_TO_USE.lower():
23+
# model_to_use = 1 # OpenAI model
24+
# elif "deepseek" in MODEL_TO_USE.lower():
25+
# model_to_use = 2
26+
# else:
27+
# logger.error("Invalid model selection in config. Please select 'gpt' for OpenAI or 'deepseek' for DeepSeek.")
28+
# logger.warning("Falling back to DeepSeek model as default.")
29+
# model_to_use = 2 # 1 for OpenAI, 2 for DeepSeek
30+
# raise ValueError("Invalid model selection in config. Please select 'gpt' for OpenAI or 'deepseek' for DeepSeek.")
31+
32+
# if model_to_use == 1:
33+
# tokens_per_chunk = 100000
34+
# max_chunks_allowed = 4
35+
# max_tokens = 1024
36+
# model = "gpt-4o-mini"
37+
# client = openai.OpenAI(api_key=OPENAI_API_KEY, base_url="https://api.openai.com/v1")
38+
# logger.info(f"Using OpenAI {model} model for summarization.")
39+
# elif model_to_use == 2:
40+
# tokens_per_chunk = 64000
41+
# max_chunks_allowed = 5
42+
# max_tokens = 1024
43+
# model = "deepseek-chat"
44+
# # for DeepSeek backward compatibility, you can still use `https://api.deepseek.com/v1` as `base_url`.
45+
# client = openai.OpenAI(api_key=DEEPSEEK_API_KEY, base_url="https://api.deepseek.com")
46+
# logger.info(f"Using DeepSeek {model} for summarization.")
47+
# else:
48+
# logger.error("Invalid model selection. Please select 1 for OpenAI or 2 for DeepSeek.")
4749

4850

4951
async def summarize_chunk(chunk, language):
@@ -64,21 +66,27 @@ def _summarize_sync(chunk, language):
6466
estimated_cost (float): The estimated cost of the OpenAI API call.
6567
word_count (int): The word count of the summary.
6668
"""
69+
model_params = get_model_params(MODEL_TO_USE)
70+
6771
try:
6872
# Define the prompt for summarization
6973
system_role = "You are a master of extracting pearls of knowledge from YouTube video transcripts. You grasp the very essence and distill it in a concise form for users. You always provide the response in the same language in which the transcript is provided. Your answers are always clear, concise and nicely formatted."
7074
prompt = (
7175
f"If I did not have time to read this YouTube video transcript, what are the most important things I absolutely must know. Enlighten me in no more than 200 words. "
7276
f"Always provide your response in the same language as the transcript. In this case it might be in '{language}' language. Here is the transcript itself:\n\n{chunk}"
7377
)
78+
# prompt = (
79+
# f"If I did not have time to read this YouTube video transcript, what are the most important things I absolutely must know. Enlighten me in no more than 200 words. "
80+
# f"Provide your response strictly in the following language: '{language}'. Here is the transcript itself:\n\n{chunk}"
81+
# )
7482

75-
response = client.chat.completions.create(
76-
model=model,
83+
response = model_params["client"].chat.completions.create(
84+
model=model_params["model"],
7785
messages=[
7886
{"role": "system", "content": system_role},
7987
{"role": "user", "content": prompt},
8088
],
81-
max_tokens=max_tokens,
89+
max_tokens=model_params["max_tokens"],
8290
temperature=0.5,
8391
stream=False
8492
)
@@ -113,6 +121,9 @@ async def summarize_text(text, language, num_key_points=3):
113121
word_count (int): The word count of the summary.
114122
"""
115123

124+
tokens_per_chunk, max_chunks_allowed, max_tokens, model, client = get_model_params(MODEL_TO_USE).values()
125+
logger.info(f"Tokens per chunk: {tokens_per_chunk} of type {type(tokens_per_chunk)}")
126+
116127
try:
117128
# Load the encoding for the model you're using (e.g., gpt-3.5-turbo)
118129
encoding = tiktoken.encoding_for_model("gpt-3.5-turbo")
@@ -125,7 +136,7 @@ async def summarize_text(text, language, num_key_points=3):
125136
raise
126137

127138
if token_count:
128-
number_of_chunks = token_count / tokens_per_chunk # 15,000 tokens per chunk for GPT-3.5-turbo
139+
number_of_chunks = token_count / int(tokens_per_chunk) # 15,000 tokens per chunk for GPT-3.5-turbo
129140
logger.info(f"Number of chunks for summarization of the transcript: {number_of_chunks}")
130141

131142
if number_of_chunks > max_chunks_allowed:
@@ -161,17 +172,17 @@ async def summarize_text(text, language, num_key_points=3):
161172
logger.error(f"Summarization failed: {e}")
162173
raise
163174

164-
logger.info(f"Summarization completed for all chunks.\nTotal word count: {total_word_count}.\nTotal tokens used: {total_tokens_used}.\nEstimated cost: ${total_estimated_cost:.2f}")
175+
logger.info(f"Summarization completed for all chunks. Total word count: {total_word_count}. Total tokens used: {total_tokens_used}. Estimated cost: ${total_estimated_cost:.2f}")
165176

166177
return combined_summary.strip(), total_tokens_used, total_estimated_cost, total_word_count
167178

168179

169-
async def translate_summary_async(summary, src_lang, dest_lang):
170-
loop = asyncio.get_event_loop()
171-
return await loop.run_in_executor(None, translate_summary, summary, src_lang, dest_lang)
180+
# async def translate_summary_async(summary, src_lang, dest_lang):
181+
# loop = asyncio.get_event_loop()
182+
# return await loop.run_in_executor(None, translate_summary, summary, src_lang, dest_lang)
172183

173184
# Translate the summary into the target language
174-
def translate_summary(summary, src_lang, dest_lang):
185+
async def translate_summary(summary, src_lang, dest_lang):
175186
"""
176187
Translates the summary into the target language.
177188
@@ -183,8 +194,10 @@ def translate_summary(summary, src_lang, dest_lang):
183194
Returns:
184195
translated_summary (str): The translated summary.
185196
"""
197+
model_params = get_model_params(MODEL_TO_USE)
198+
186199
try:
187-
translated_summary = translate_text(summary, src_lang=src_lang, dest_lang=dest_lang)
200+
translated_summary, total_tokens_used, total_estimated_cost, total_word_count = await translate_text(summary, src_lang=src_lang, dest_lang=dest_lang, model_params=model_params)
188201
if not translated_summary:
189202
raise Exception("Translation failed.")
190203
return translated_summary
@@ -212,19 +225,21 @@ async def handle_summarization_request(text, original_language, target_language,
212225

213226
logger.info(f"Summarization is handled for original language '{original_language}' and target '{target_language}'")
214227

228+
model_params = get_model_params(MODEL_TO_USE)
229+
215230
try:
216-
# Summarize the original transcript
231+
217232
summary, tokens_used, estimated_cost, word_count = await summarize_text(text, original_language, num_key_points)
218-
219233
if target_language == 'orig':
220234
target_language = original_language
235+
221236
logger.info(f"Summary generated in {target_language} language. Translation skipped.")
222237

223238
# Translate the summary if the target language is not the original language
224239
if target_language != original_language:
225-
summary = await translate_summary_async(summary, src_lang=original_language, dest_lang=target_language)
240+
summary = await translate_summary(summary, src_lang=original_language, dest_lang=target_language)
226241

227-
return summary, tokens_used, estimated_cost, word_count, model
242+
return summary, tokens_used, estimated_cost, word_count, model_params['model']
228243
except Exception as e:
229244
logger.error(f"Failed to handle summarization request: {e}")
230245
raise

0 commit comments

Comments
 (0)