Spaces:

JaishnaCodz
/

BlogReviewer

Sleeping

App Files Community

JaishnaCodz committed on Jul 15

Commit

b63764b

verified ·

1 Parent(s): 5873b0f

Update app.py

Browse files

Files changed (1) hide show

app.py +49 -50

app.py CHANGED Viewed

@@ -10,7 +10,7 @@ import difflib
 # Load model
 reviewer = pipeline("text2text-generation", model="google/flan-t5-base")
-# OCR
 def extract_text_from_image_url(img_url):
     try:
         response = requests.get(img_url)
@@ -20,7 +20,7 @@ def extract_text_from_image_url(img_url):
     except Exception as e:
         return f"❌ OCR Error: {e}"
-# Extract blog
 def extract_text_from_url(url):
     downloaded = trafilatura.fetch_url(url)
     if downloaded:
@@ -28,42 +28,42 @@ def extract_text_from_url(url):
     else:
         return "❌ Blog Error: Could not fetch content from the URL."
-# Highlight differences using difflib
-def highlight_diffs(original, suggestion):
-    diff = difflib.ndiff(original.split(), suggestion.split())
     result = []
-    for token in diff:
-        if token.startswith("- "):
-            result.append(f"~~{token[2:]}~~")
-        elif token.startswith("+ "):
-            result.append(f"**{token[2:]}**")
-        elif token.startswith("  "):
-            result.append(token[2:])
     return " ".join(result)
-# Review lines with diffs
 def review_lines(text):
     lines = text.strip().split('\n')
-    suggestions = []
     for line in lines:
-        if line.strip() == "":
             continue
-        prompt = f"Rewrite this to fix grammar, tone, and remove any offensive language:\n\n{line}"
-        suggestion = reviewer(prompt, max_new_tokens=100)[0]['generated_text'].strip()
-        highlighted = highlight_diffs(line.strip(), suggestion)
-        suggestions.append((line, highlighted, suggestion))
-    return suggestions
 # Finalize accepted suggestions
 def finalize_text(originals, suggestions, decisions):
-    final = []
-    for orig, sugg, keep in zip(originals, suggestions, decisions):
-        final.append(sugg if keep else orig)
-    return "\n".join(final)
-# Gradio app
-with gr.Blocks(theme=gr.themes.Soft(primary_hue="blue")) as app:
-    gr.Markdown("## ✨ BlogChecker AI\nSmart AI reviewer for blog content, with interactive approval and OCR image support.")
     with gr.Row():
         blog_url = gr.Textbox(label="📎 Blog URL")
@@ -76,41 +76,40 @@ with gr.Blocks(theme=gr.themes.Soft(primary_hue="blue")) as app:
         review_btn = gr.Button("🧠 Review Content")
         finalize_btn = gr.Button("✅ Finalize Clean Blog")
-    review_section = gr.Column(visible=False)
-    review_boxes = []  # Will store tuples: (original_box, highlighted_markdown_box, accept_checkbox, clean_suggestion)
     final_output = gr.Textbox(label="📦 Final Clean Blog", lines=10)
-    # Text extraction logic
     def extract_both(url, img_url):
         blog = extract_text_from_url(url)
         ocr = extract_text_from_image_url(img_url) if img_url else ""
         return blog + ("\n" + ocr if ocr else "")
-    # Review processing with diffs
-    def process_review(text):
         results = review_lines(text)
-        review_section.children.clear()
         review_boxes.clear()
-        for i, (orig, highlighted, clean_sugg) in enumerate(results):
-            with review_section:
-                orig_box = gr.Textbox(value=orig, label=f"Original Line {i+1}", interactive=False)
-                markdown_sugg = gr.Markdown(value=highlighted, label=f"Suggested Edit {i+1}")
-                accept_box = gr.Checkbox(label="✅ Accept Suggestion", value=False)
-                review_boxes.append((orig_box, markdown_sugg, accept_box, clean_sugg))
         return gr.update(visible=True)
-    # Finalization logic
-    def collect_dynamic_decisions():
-        originals_vals = [box[0].value for box in review_boxes]
-        clean_suggestions = [box[3] for box in review_boxes]
-        accepts_vals = [box[2].value for box in review_boxes]
-        return finalize_text(originals_vals, clean_suggestions, accepts_vals)
-    # Wire actions
     extract_btn.click(fn=extract_both, inputs=[blog_url, image_url], outputs=combined_text)
-    review_btn.click(fn=process_review, inputs=combined_text, outputs=review_section)
-    finalize_btn.click(fn=collect_dynamic_decisions, outputs=final_output)
 app.launch()

 # Load model
 reviewer = pipeline("text2text-generation", model="google/flan-t5-base")
+# OCR from image URL
 def extract_text_from_image_url(img_url):
     try:
         response = requests.get(img_url)
     except Exception as e:
         return f"❌ OCR Error: {e}"
+# Extract main blog content from URL
 def extract_text_from_url(url):
     downloaded = trafilatura.fetch_url(url)
     if downloaded:
     else:
         return "❌ Blog Error: Could not fetch content from the URL."
+# Highlight diffs using difflib
+def highlight_diffs(orig, suggestion):
+    diff = difflib.ndiff(orig.split(), suggestion.split())
     result = []
+    for word in diff:
+        if word.startswith('- '):
+            result.append(f"~~{word[2:]}~~")
+        elif word.startswith('+ '):
+            result.append(f"**{word[2:]}**")
+        elif word.startswith('  '):
+            result.append(word[2:])
     return " ".join(result)
+# Review line-by-line
 def review_lines(text):
     lines = text.strip().split('\n')
+    reviewed = []
     for line in lines:
+        if not line.strip():
             continue
+        prompt = f"Fix grammar, tone, and clarity:\n\n{line}"
+        response = reviewer(prompt, max_new_tokens=100)[0]['generated_text'].strip()
+        highlighted = highlight_diffs(line.strip(), response)
+        reviewed.append((line.strip(), highlighted, response))
+    return reviewed
 # Finalize accepted suggestions
 def finalize_text(originals, suggestions, decisions):
+    output = []
+    for orig, sugg, accepted in zip(originals, suggestions, decisions):
+        output.append(sugg if accepted else orig)
+    return "\n".join(output)
+# Build Gradio UI
+with gr.Blocks(theme=gr.themes.Soft()) as app:
+    gr.Markdown("## ✨ BlogChecker AI\nSmart blog reviewer with OCR + AI suggestions")
     with gr.Row():
         blog_url = gr.Textbox(label="📎 Blog URL")
         review_btn = gr.Button("🧠 Review Content")
         finalize_btn = gr.Button("✅ Finalize Clean Blog")
+    review_area = gr.Column(visible=False)
     final_output = gr.Textbox(label="📦 Final Clean Blog", lines=10)
+    review_boxes = []
+    # Extract combined content
     def extract_both(url, img_url):
         blog = extract_text_from_url(url)
         ocr = extract_text_from_image_url(img_url) if img_url else ""
         return blog + ("\n" + ocr if ocr else "")
+    # Review and build UI dynamically
+    def do_review(text):
         results = review_lines(text)
+        review_area.children.clear()
         review_boxes.clear()
+        for idx, (orig, highlighted, clean) in enumerate(results):
+            with review_area:
+                orig_box = gr.Textbox(value=orig, label=f"Original Line {idx+1}", interactive=False)
+                markdown_sugg = gr.Markdown(value=highlighted, label=f"Suggested Edit {idx+1}")
+                accept = gr.Checkbox(label="✅ Accept Suggestion", value=False)
+                review_boxes.append((orig_box, clean, accept))
         return gr.update(visible=True)
+    # Compile final clean version
+    def collect_results():
+        originals = [box[0].value for box in review_boxes]
+        suggestions = [box[1] for box in review_boxes]
+        accepts = [box[2].value for box in review_boxes]
+        return finalize_text(originals, suggestions, accepts)
+    # Wire buttons
     extract_btn.click(fn=extract_both, inputs=[blog_url, image_url], outputs=combined_text)
+    review_btn.click(fn=do_review, inputs=combined_text, outputs=review_area)
+    finalize_btn.click(fn=collect_results, outputs=final_output)
 app.launch()