Initial commit: hardened DeerFlow factory

Vendored deer-flow upstream (bytedance/deer-flow) plus prompt-injection hardening: - New deerflow.security package: content_delimiter, html_cleaner, sanitizer (8 layers — invisible chars, control chars, symbols, NFC, PUA, tag chars, horizontal whitespace collapse with newline/tab preservation, length cap) - New deerflow.community.searx package: web_search, web_fetch, image_search backed by a private SearX instance, every external string sanitized and wrapped in <<<EXTERNAL_UNTRUSTED_CONTENT>>> delimiters - All native community web providers (ddg_search, tavily, exa, firecrawl, jina_ai, infoquest, image_search) replaced with hard-fail stubs that raise NativeWebToolDisabledError at import time, so a misconfigured tool.use path fails loud rather than silently falling back to unsanitized output - Native client back-doors (jina_client.py, infoquest_client.py) stubbed too - Native-tool tests quarantined under tests/_disabled_native/ (collect_ignore_glob via local conftest.py) - Sanitizer Layer 7 fix: only collapse horizontal whitespace, preserve newlines and tabs so list/table structure survives - Hardened runtime config.yaml references only the searx-backed tools - Factory overlay (backend/) kept in sync with deer-flow tree as a reference / source See HARDENING.md for the full audit trail and verification steps.
2026-04-12 14:23:57 +02:00
commit 6de0bf9f5b
889 changed files with 173052 additions and 0 deletions
--- a/deer-flow/skills/public/ppt-generation/scripts/generate.py
+++ b/deer-flow/skills/public/ppt-generation/scripts/generate.py
@@ -0,0 +1,161 @@
+import json
+import os
+from io import BytesIO
+
+from PIL import Image
+from pptx import Presentation
+from pptx.util import Inches
+
+
+def generate_ppt(
+    plan_file: str,
+    slide_images: list[str],
+    output_file: str,
+) -> str:
+    """
+    Generate a PowerPoint presentation from slide images.
+
+    Args:
+        plan_file: Path to JSON file containing presentation plan
+        slide_images: List of paths to slide images in order
+        output_file: Path to output PPTX file
+
+    Returns:
+        Status message
+    """
+    # Load presentation plan
+    with open(plan_file, "r", encoding="utf-8") as f:
+        plan = json.load(f)
+
+    # Determine slide dimensions based on aspect ratio
+    aspect_ratio = plan.get("aspect_ratio", "16:9")
+    if aspect_ratio == "16:9":
+        slide_width = Inches(13.333)
+        slide_height = Inches(7.5)
+    elif aspect_ratio == "4:3":
+        slide_width = Inches(10)
+        slide_height = Inches(7.5)
+    else:
+        # Default to 16:9
+        slide_width = Inches(13.333)
+        slide_height = Inches(7.5)
+
+    # Create presentation with specified dimensions
+    prs = Presentation()
+    prs.slide_width = slide_width
+    prs.slide_height = slide_height
+
+    # Get blank layout
+    blank_layout = prs.slide_layouts[6]  # Blank layout
+
+    # Add each slide image
+    slides_info = plan.get("slides", [])
+
+    for i, image_path in enumerate(slide_images):
+        if not os.path.exists(image_path):
+            return f"Error: Slide image not found: {image_path}"
+
+        # Add a blank slide
+        slide = prs.slides.add_slide(blank_layout)
+
+        # Load and process image
+        with Image.open(image_path) as img:
+            # Convert to RGB if necessary (for PNG with transparency)
+            if img.mode in ("RGBA", "P"):
+                img = img.convert("RGB")
+
+            # Calculate dimensions to fill slide while maintaining aspect ratio
+            img_width, img_height = img.size
+            img_aspect = img_width / img_height
+            slide_aspect = slide_width / slide_height
+
+            # Convert to EMU for calculations
+            slide_width_emu = int(slide_width)
+            slide_height_emu = int(slide_height)
+
+            if img_aspect > slide_aspect:
+                # Image is wider - fit to width
+                new_width_emu = slide_width_emu
+                new_height_emu = int(slide_width_emu / img_aspect)
+                left = Inches(0)
+                top = Inches((slide_height_emu - new_height_emu) / 914400)
+            else:
+                # Image is taller - fit to height
+                new_height_emu = slide_height_emu
+                new_width_emu = int(slide_height_emu * img_aspect)
+                left = Inches((slide_width_emu - new_width_emu) / 914400)
+                top = Inches(0)
+
+            # Save processed image to bytes
+            img_bytes = BytesIO()
+            img.save(img_bytes, format="JPEG", quality=95)
+            img_bytes.seek(0)
+
+            # Add image to slide
+            slide.shapes.add_picture(
+                img_bytes, left, top, Inches(new_width_emu / 914400), Inches(new_height_emu / 914400)
+            )
+
+        # Add speaker notes if available in plan
+        if i < len(slides_info):
+            slide_info = slides_info[i]
+            notes = []
+
+            if slide_info.get("title"):
+                notes.append(f"Title: {slide_info['title']}")
+
+            if slide_info.get("subtitle"):
+                notes.append(f"Subtitle: {slide_info['subtitle']}")
+
+            if slide_info.get("key_points"):
+                notes.append("Key Points:")
+                for point in slide_info["key_points"]:
+                    notes.append(f"  • {point}")
+
+            if notes:
+                notes_slide = slide.notes_slide
+                text_frame = notes_slide.notes_text_frame
+                if text_frame is not None:
+                    text_frame.text = "\n".join(notes)
+
+    # Save presentation
+    prs.save(output_file)
+
+    return f"Successfully generated presentation with {len(slide_images)} slides to {output_file}"
+
+
+if __name__ == "__main__":
+    import argparse
+
+    parser = argparse.ArgumentParser(
+        description="Generate PowerPoint presentation from slide images"
+    )
+    parser.add_argument(
+        "--plan-file",
+        required=True,
+        help="Absolute path to JSON presentation plan file",
+    )
+    parser.add_argument(
+        "--slide-images",
+        nargs="+",
+        required=True,
+        help="Absolute paths to slide images in order (space-separated)",
+    )
+    parser.add_argument(
+        "--output-file",
+        required=True,
+        help="Output path for generated PPTX file",
+    )
+
+    args = parser.parse_args()
+
+    try:
+        print(
+            generate_ppt(
+                args.plan_file,
+                args.slide_images,
+                args.output_file,
+            )
+        )
+    except Exception as e:
+        print(f"Error while generating presentation: {e}")