Spaces: Runtime error
Saiteja Solleti committed · Commit 55915f0 · Parent(s): 14249c4

Revert "tokening"

This reverts commit 585864a7c72456302949a2de8f4ae04376afd17f.
- generationhelper.py +0 -33
- requirements.txt +1 -2
generationhelper.py
CHANGED
@@ -1,7 +1,5 @@
 import os
 from groq import Groq
-import time
-import tiktoken
 
 groq_token = os.getenv("GROQ_TOKEN")
 
@@ -9,35 +7,6 @@ groq_client = Groq(
     api_key = groq_token
 )
 
-# Initialize token counter and timestamp
-tokens_used = 0
-start_time = time.time()
-
-def Count_tokens(text: str, model="gpt-3.5-turbo"):
-    """Counts tokens in the given text using tiktoken."""
-    enc = tiktoken.encoding_for_model(model)
-    return len(enc.encode(text))
-
-def Enforce_token_limit(prompt, max_tokens_per_minute=6000):
-    """Ensures that token usage stays within the allowed rate limit."""
-    global tokens_used, start_time
-
-    tokens = Count_tokens(prompt)
-    elapsed_time = time.time() - start_time
-
-    # If the token limit is exceeded, wait until the reset
-    if tokens_used + tokens > max_tokens_per_minute:
-        if elapsed_time < 60:
-            sleep_time = 60 - elapsed_time
-            print(f"Rate limit reached! Sleeping for {sleep_time:.2f} seconds...")
-            time.sleep(sleep_time)
-
-        # Reset counter after sleeping
-        tokens_used = 0
-        start_time = time.time()
-
-    # Update token count
-    tokens_used += tokens
 
 
 def GenerateAnswer(query, top_documents, prompt_model, timeout_seconds: int = 30):
@@ -59,8 +28,6 @@ def GenerateAnswer(query, top_documents, prompt_model, timeout_seconds: int = 30
     Answer:
     """
 
-    Enforce_token_limit(prompt)
-
     # Call Groq API (Llama 3.3-70B)
     completion = groq_client.chat.completions.create(
         model=prompt_model,
requirements.txt
CHANGED
@@ -5,5 +5,4 @@ huggingface_hub
 pymilvus
 nltk
 sentence-transformers
-Groq
-tiktoken
+Groq