Spaces:

Hadiil
/

home23

Sleeping

App Files Files Community

Update app.py

by luck210 - opened Apr 8

base: refs/heads/main

←

from: refs/pr/1

Discussion Files changed

+40

-191

Files changed (1) hide show

app.py +40 -191

app.py CHANGED Viewed

@@ -119,20 +119,29 @@ def get_chatbot_response(user_input: str):
     except Exception as e:
         return f"Error: {str(e)}"
-def translate_text(text: str, target_language: str):
-    """Translate text to any target language using Gemini"""
     if not text:
         return "Please provide text to translate."
     try:
         translator = load_model("translation")
-        prompt = f"Translate this text to {target_language}: {text}"
         response = translator.generate_content(prompt)
         return response.text.strip()
     except Exception as e:
         return f"Translation error: {str(e)}"
 def detect_intent(text: str = None, file: UploadFile = None) -> tuple[str, str]:
-    """Enhanced intent detection with dynamic translation support including bracketed languages"""
     target_language = "English"  # Default
     if file:
@@ -156,12 +165,13 @@ def detect_intent(text: str = None, file: UploadFile = None) -> tuple[str, str]:
     if any(keyword in text_lower for keyword in ['chat', 'talk', 'converse', 'ask gemini']):
         return "chatbot", target_language
-    # Dynamic translation detection with optional brackets
-    translate_match = re.search(r'translate.*to\s+\[?([a-zA-Z]+)\]?:?', text_lower)
     if translate_match:
-        target_language = translate_match.group(1).capitalize()
         return "translate", target_language
     vqa_patterns = [
         r'how (many|much)',
         r'what (color|size|position|shape)',
@@ -173,40 +183,9 @@ def detect_intent(text: str = None, file: UploadFile = None) -> tuple[str, str]:
     if any(re.search(pattern, text_lower) for pattern in vqa_patterns):
         return "visual-qa", target_language
-    summarization_patterns = [
-        r'\b(summar(y|ize|ise)|brief( overview)?)\b',
-        r'\b(long article|text|document)\b',
-        r'\bcan you (summar|brief|condense)\b',
-        r'\b(short summary|brief explanation)\b',
-        r'\b(overview|main points|key ideas)\b',
-        r'\b(tl;?dr|too long didn\'?t read)\b'
-    ]
-    if any(re.search(pattern, text_lower) for pattern in summarization_patterns):
-        return "summarize", target_language
-    question_patterns = [
-        r'\b(what|when|where|why|how|who|which)\b',
-        r'\?',
-        r'\b(explain|tell me|describe|define)\b'
-    ]
-    if any(re.search(pattern, text_lower) for pattern in question_patterns):
-        return "question-answering", target_language
-    generation_patterns = [
-        r'\b(write|generate|create|compose)\b',
-        r'\b(story|poem|essay|text|content)\b'
-    ]
-    if any(re.search(pattern, text_lower) for pattern in generation_patterns):
-        return "text-generation", target_language
-    if len(text) > 100:
-        return "summarize", target_language
     return "chatbot", target_language
 class ProcessResponse(BaseModel):
     response: str
     type: str
@@ -309,14 +288,8 @@ async def process_input(
     text: str = Form(None),
     file: UploadFile = File(None)
 ):
-    """Enhanced unified endpoint with dynamic translation"""
-    start_time = time.time()
-    client_ip = request.client.host
-    logger.info(f"Request from {client_ip}: text={text[:50] + '...' if text and len(text) > 50 else text}, file={file.filename if file else None}")
-    intent, target_language = detect_intent(text, file)
-    logger.info(f"Detected intent: {intent}, target_language: {target_language}")
     try:
         if intent == "chatbot":
             response = get_chatbot_response(text)
@@ -324,156 +297,32 @@ async def process_input(
         elif intent == "translate":
             content = await extract_text_from_file(file) if file else text
-            content = re.sub(r'translate.*to\s+\[?[a-zA-Z]+\]?:?\s*', '', content, flags=re.IGNORECASE).strip()
-            translated_text = translate_text(content, target_language)
-            return {"response": translated_text, "type": "translation"}
-        elif intent == "summarize":
-            content = await extract_text_from_file(file) if file else text
-            summarizer = load_model("summarization")
-            content_length = len(content.split())
-            max_len = max(30, min(150, content_length//2))
-            min_len = max(15, min(30, max_len//2))
-            if len(content) > 1024:
-                chunks = [content[i:i+1024] for i in range(0, len(content), 1024)]
-                summaries = []
-                for chunk in chunks[:3]:
-                    summary = summarizer(
-                        chunk,
-                        max_length=max_len,
-                        min_length=min_len,
-                        do_sample=False,
-                        truncation=True
-                    )
-                    summaries.append(summary[0]['summary_text'])
-                final_summary = " ".join(summaries)
-            else:
-                summary = summarizer(
-                    content,
-                    max_length=max_len,
-                    min_length=min_len,
-                    do_sample=False,
-                    truncation=True
-                )
-                final_summary = summary[0]['summary_text']
-            final_summary = re.sub(r'\s+', ' ', final_summary).strip()
-            return {"response": final_summary, "type": "summary"}
-        elif intent == "question-answering":
-            context = await extract_text_from_file(file) if file else None
-            if not context and not text:
-                raise HTTPException(status_code=400, detail="No context provided")
-            qa_pipeline = load_model("question-answering")
-            if not context and "?" in text:
-                parts = text.split("?", 1)
-                question = parts[0] + "?"
-                context = parts[1].strip() if len(parts) > 1 and parts[1].strip() else text
-            else:
-                question = text if text else "Summarize this document"
-            result = qa_pipeline(
-                question=question,
-                context=context[:2000] if context else text[:2000]
-            )
-            return {"response": result["answer"], "type": "answer"}
-        elif intent == "image-to-text":
-            if not file or not file.content_type.startswith('image/'):
-                raise HTTPException(status_code=400, detail="An image file is required")
-            image = Image.open(io.BytesIO(await file.read()))
-            captioner = load_model("image-to-text")
-            caption = captioner(image, max_new_tokens=50)
-            return {"response": caption[0]['generated_text'], "type": "caption"}
-        elif intent == "visual-qa":
-            if not file or not file.content_type.startswith('image/'):
-                raise HTTPException(status_code=400, detail="An image file is required")
-            if not text:
-                raise HTTPException(status_code=400, detail="A question is required for VQA")
-            image = Image.open(io.BytesIO(await file.read())).convert("RGB")
-            vqa_pipeline = load_model("visual-qa")
-            question = text.strip()
-            if not question.endswith('?'):
-                question += '?'
-            answer = vqa_pipeline(
-                image=image,
-                question=question
-            )
-            answer = answer.strip()
-            if not answer or answer.lower() == question.lower():
-                logger.warning(f"VQA failed to generate a meaningful answer: {answer}")
-                answer = "I couldn't determine the answer from the image."
-            else:
-                answer = answer.capitalize()
-                if not answer.endswith(('.', '!', '?')):
-                    answer += '.'
-            logger.info(f"Final VQA answer: {answer}")
             return {
-                "response": answer,
-                "type": "visual_qa",
                 "additional_data": {
-                    "question": text,
-                    "image_size": f"{image.width}x{image.height}"
                 }
             }
-        elif intent == "visualize":
-            if not file:
-                raise HTTPException(status_code=400, detail="An Excel file is required")
-            file_content = await file.read()
-            if file.filename.endswith('.csv'):
-                df = pd.read_csv(io.BytesIO(file_content))
-            else:
-                df = pd.read_excel(io.BytesIO(file_content))
-            code = generate_visualization_code(df, text)
-            return {"response": code, "type": "visualization_code"}
-        elif intent == "text-generation":
-            generator = load_model("text-generation")
-            generated = generator(
-                text,
-                max_length=200,
-                num_return_sequences=1,
-                temperature=0.8,
-                top_p=0.92,
-                do_sample=True
-            )
-            return {"response": generated[0]["generated_text"], "type": "generated_text"}
-        else:
-            response = get_chatbot_response(text or "Hello! How can I assist you?")
-            return {"response": response, "type": "chat"}
-    except Exception as e:
-        logger.error(f"Processing error: {str(e)}", exc_info=True)
-        raise HTTPException(status_code=500, detail=str(e))
-    finally:
-        process_time = time.time() - start_time
-        logger.info(f"Request processed in {process_time:.2f} seconds")
 async def extract_text_from_file(file: UploadFile) -> str:
     """Enhanced text extraction with better error handling and format support"""

     except Exception as e:
         return f"Error: {str(e)}"
+def translate_text(text: str, target_language: str) -> str:
+    """Translate text to target language using Gemini with improved error handling"""
     if not text:
         return "Please provide text to translate."
+    if not target_language:
+        return "Please specify a target language."
     try:
         translator = load_model("translation")
+        # Enhanced prompt with clearer instructions
+        prompt = f"Translate the following text to {target_language}. Only provide the translated text without any additional commentary: {text}"
         response = translator.generate_content(prompt)
+        if not response.text or response.text.strip() == text:
+            return f"Translation to {target_language} failed or produced no change."
         return response.text.strip()
     except Exception as e:
+        logger.error(f"Translation error: {str(e)}")
         return f"Translation error: {str(e)}"
 def detect_intent(text: str = None, file: UploadFile = None) -> tuple[str, str]:
+    """Enhanced intent detection with improved translation handling"""
     target_language = "English"  # Default
     if file:
     if any(keyword in text_lower for keyword in ['chat', 'talk', 'converse', 'ask gemini']):
         return "chatbot", target_language
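+    # Translation detection: the target language may be bracketed and may span several words.
+    # NOTE(review): the capture class accepts whitespace, so when no ':' or ']' follows the language name, the words after it are captured as part of the language.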
+    translate_match = re.search(r'translate.*to\s+\[?([a-zA-Z\s]+)\]?:?', text_lower)
     if translate_match:
+        target_language = translate_match.group(1).strip().capitalize()
         return "translate", target_language
+    # Rest of the function remains the same...
     vqa_patterns = [
         r'how (many|much)',
         r'what (color|size|position|shape)',
     if any(re.search(pattern, text_lower) for pattern in vqa_patterns):
         return "visual-qa", target_language
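+    # NOTE(review): the summarization, question-answering and text-generation pattern checks (and the length-based "summarize" fallback) are removed by this change, not elided; input that matches nothing above now falls through to "chatbot".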
     return "chatbot", target_language
 class ProcessResponse(BaseModel):
     response: str
     type: str
     text: str = Form(None),
     file: UploadFile = File(None)
 ):
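+    # NOTE(review): placeholder for the removed setup lines. The `intent, target_language = detect_intent(text, file)` call has to be restored here, because both names are used below.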
     try:
         if intent == "chatbot":
             response = get_chatbot_response(text)
         elif intent == "translate":
             content = await extract_text_from_file(file) if file else text
+            if not content:
+                raise HTTPException(status_code=400, detail="No content to translate")
+            # Clean the input text from translation command
+            content_to_translate = re.sub(
+                r'translate.*to\s+\[?[a-zA-Z\s]+\]?:?\s*',
+                '',
+                content,
+                flags=re.IGNORECASE
+            ).strip()
+            if not content_to_translate:
+                raise HTTPException(status_code=400, detail="No text remains after parsing translation command")
+            translated_text = translate_text(content_to_translate, target_language)
             return {
+                "response": translated_text,
+                "type": "translation",
                 "additional_data": {
+                    "original_text": content_to_translate,
+                    "target_language": target_language
                 }
             }
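+        # NOTE(review): placeholder for the removed intent branches. The `except`/`finally` clauses of this `try` were removed as well and must be restored for the function to parse.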
 async def extract_text_from_file(file: UploadFile) -> str:
     """Enhanced text extraction with better error handling and format support"""