bot.py

#!/usr/bin/env python3
"""
Discord bot for #remora channel - analyzes links in real-time with web_fetch + AI
Posts summaries, adds to Tududi inbox, maintains JSON history + logs
"""

import discord
import os
import json
import re
import requests
from datetime import datetime
from pathlib import Path
from dotenv import load_dotenv
import logging
from urllib.parse import urlparse

# Load .env file
load_dotenv()

# Setup logging
log_file = Path(__file__).parent / "bot.log"
logging.basicConfig(
    level=logging.DEBUG,
    format='[%(asctime)s] [%(levelname)-8s] %(message)s',
    handlers=[
        logging.FileHandler(log_file),
        logging.StreamHandler()
    ]
)
logger = logging.getLogger(__name__)

# Config
CHANNEL_ID = 1467557082583535729
TRACKER_FILE = Path(__file__).parent / "tracker.json"
TUDUDI_API_URL = os.getenv("TUDUDI_API_URL", "https://todo.dilain.com/api/v1")
TUDUDI_API_KEY = os.getenv("TUDUDI_API_KEY")
GATEWAY_URL = os.getenv("OPENCLAW_GATEWAY", "http://127.0.0.1:18789")
GATEWAY_TOKEN = os.getenv("OPENCLAW_GATEWAY_TOKEN", "")

logger.info("=" * 60)
logger.info("Bot startup")
logger.info(f"  Channel ID: {CHANNEL_ID}")
logger.info(f"  Tududi API: {TUDUDI_API_URL}")
logger.info(f"  Gateway: {GATEWAY_URL}")
logger.info("=" * 60)

# Load or init tracker
def load_tracker():
    if TRACKER_FILE.exists():
        with open(TRACKER_FILE) as f:
            return json.load(f)
    return {
        "channel_id": CHANNEL_ID,
        "processed_message_ids": [],
        "links": []
    }

def save_tracker(data):
    with open(TRACKER_FILE, "w") as f:
        json.dump(data, f, indent=2)

# Detect links in text
def extract_urls(text):
    url_pattern = r'https?://[^\s<>"{}|\\^`\[\]]+'
    return re.findall(url_pattern, text)

# Detect link type
def detect_link_type(url):
    domain = urlparse(url).netloc.lower()
    
    if "github.com" in domain:
        return "GitHub"
    elif "reddit.com" in domain:
        return "Reddit"
    elif "youtube.com" in domain or "youtu.be" in domain:
        return "YouTube"
    elif "tiktok.com" in domain:
        return "TikTok"
    elif "twitter.com" in domain or "x.com" in domain:
        return "Twitter/X"
    elif "medium.com" in domain:
        return "Medium"
    elif "dev.to" in domain:
        return "Dev.to"
    elif "arxiv.org" in domain:
        return "arXiv"
    else:
        return "Article"

# Fetch URL content using requests
def fetch_url_content(url):
    """Fetch URL and return title + excerpt"""
    logger.debug(f"  📥 Fetching: {url}")
    
    try:
        response = requests.get(
            url,
            timeout=8,
            headers={
                'User-Agent': 'Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36',
                'Accept': 'text/html,application/xhtml+xml'
            },
            allow_redirects=True
        )
        response.raise_for_status()
        content = response.text[:4000]  # First 4k chars
        
        # Try multiple patterns for title
        title = None
        
        # Pattern 1: <title> tag
        title_match = re.search(r'<title[^>]*>\s*([^<]+?)\s*</title>', content, re.IGNORECASE)
        if title_match:
            title = title_match.group(1).strip()
        
        # Pattern 2: og:title meta tag (for GitHub, etc.)
        if not title:
            og_match = re.search(r'<meta\s+property="og:title"\s+content="([^"]+)"', content, re.IGNORECASE)
            if og_match:
                title = og_match.group(1).strip()
        
        # Pattern 3: h1 tag (for GitHub README)
        if not title:
            h1_match = re.search(r'<h1[^>]*>([^<]+)</h1>', content, re.IGNORECASE)
            if h1_match:
                title = h1_match.group(1).strip()
        
        # Fallback
        if not title:
            title = url.split('/')[-1] or "Untitled"
        
        # Extract meta description
        desc_match = re.search(r'<meta\s+name="description"\s+content="([^"]+)"', content, re.IGNORECASE)
        description = desc_match.group(1) if desc_match else ""
        
        # Extract og:description
        if not description:
            og_desc = re.search(r'<meta\s+property="og:description"\s+content="([^"]+)"', content, re.IGNORECASE)
            if og_desc:
                description = og_desc.group(1)
        
        logger.debug(f"    ✓ Fetched: {title}")
        return {
            "title": title,
            "description": description,
            "content": content,
            "status": "ok"
        }
    except requests.Timeout:
        logger.warning(f"    ⏱️ Timeout: {url}")
        return {"title": "Request timeout", "status": "timeout", "content": ""}
    except requests.HTTPError as e:
        logger.warning(f"    ❌ HTTP {e.response.status_code}: {url}")
        return {"title": f"HTTP {e.response.status_code}", "status": "http_error", "content": ""}
    except Exception as e:
        logger.error(f"    ❌ Error: {e}")
        return {"title": "Fetch failed", "status": "error", "error": str(e), "content": ""}

# Analyze content (local heuristic-based)
def analyze_content(url, title, content, link_type):
    """Analyze content and suggest summary + tag locally"""
    logger.debug(f"  🤖 Analyzing content: {url}")
    logger.debug(f"    Content length: {len(content)} chars")
    logger.debug(f"    Link type: {link_type}")
    
    try:
        # Extract useful info from HTML content
        description = ""
        
        # Looking for meta description
        desc_match = re.search(r'<meta\s+name="description"\s+content="([^"]+)"', content, re.IGNORECASE)
        if desc_match:
            description = desc_match.group(1).strip()
            logger.debug(f"    Found meta description: {description[:80]}")
        
        # Looking for og:description
        if not description:
            og_desc = re.search(r'<meta\s+property="og:description"\s+content="([^"]+)"', content, re.IGNORECASE)
            if og_desc:
                description = og_desc.group(1).strip()
                logger.debug(f"    Found og:description: {description[:80]}")
        
        # Looking for first paragraph after title
        if not description:
            p_match = re.search(r'<p[^>]*>([^<]+)</p>', content, re.IGNORECASE)
            if p_match:
                description = p_match.group(1).strip()[:200]
        
        # Determine tag based on content + URL + type
        tag = "interesting"
        summary = ""
        
        if link_type == "GitHub":
            tag = "project"
            summary = f"GitHub repository: {title}"
            # Try to extract more info from README
            readme_match = re.search(r'README[^<]*</h[1-3]>[^<]*<p[^>]*>([^<]+)', content, re.IGNORECASE)
            if readme_match:
                summary += f". {readme_match.group(1)[:100]}"
        
        elif link_type == "YouTube":
            tag = "video"
            summary = f"Video: {title}"
            if description:
                summary += f". {description[:80]}"
        
        elif link_type == "Reddit":
            tag = "discussion"
            summary = f"Reddit discussion: {title}"
        
        elif link_type == "Medium" or link_type == "Dev.to":
            tag = "article"
            summary = f"Article: {title}"
            if description:
                summary += f". {description[:80]}"
        
        elif link_type == "arXiv":
            tag = "learning"
            summary = f"Research paper: {title}"
        
        else:
            # Generic web article
            tag = "to-read"
            summary = title
            if description:
                summary += f". {description[:100]}"
        
        # Truncate summary to reasonable length
        summary = summary[:200]
        
        logger.info(f"    ✓ Analysis complete - Tag: {tag}, Summary: {summary[:60]}")
        
        result = {
            "summary": summary,
            "tag": tag,
            "relevance": "relevant"
        }
        logger.debug(f"    Returning: {result}")
        return result
        
    except Exception as e:
        logger.error(f"    Analysis error: {e}")
        import traceback
        logger.error(traceback.format_exc())
        # Return minimal analysis
        return {
            "summary": title,
            "tag": "interesting",
            "relevance": "relevant"
        }

# Send to Tududi inbox
def add_to_tududi(title, url, link_type, summary="", tag=""):
    """Add to Tududi inbox with intelligent summary"""
    logger.debug(f"  📌 Adding to Tududi: {title}")
    
    try:
        if not TUDUDI_API_KEY:
            logger.warning("    TUDUDI_API_KEY not set")
            return False
        
        # Format the inbox content
        content = f"📌 **{link_type}**: {title}\n🔗 {url}"
        
        if summary:
            content += f"\n\n💡 **Summary**:\n{summary}"
        
        if tag:
            content += f"\n\n🏷️ **Tag**: {tag}"
        
        response = requests.post(
            f"{TUDUDI_API_URL}/inbox",
            headers={
                "Authorization": f"Bearer {TUDUDI_API_KEY}",
                "Content-Type": "application/json"
            },
            json={"content": content},
            timeout=5
        )
        
        if response.status_code in [200, 201]:  # 200 or 201 are both OK
            logger.info(f"    ✓ Added to Tududi inbox with tag: {tag}")
            return True
        else:
            logger.warning(f"    Tududi error: {response.status_code}")
            return False
    except Exception as e:
        logger.error(f"    Tududi error: {e}")
        return False

# Discord bot
intents = discord.Intents.default()
intents.message_content = True

class LinkAnalyzerBot(discord.Client):
    async def on_ready(self):
        logger.info(f"✅ Bot logged in as {self.user}")
        logger.info(f"📍 Watching channel #remora ({CHANNEL_ID})")

    async def on_message(self, message):
        # Ignore bot's own messages
        if message.author == self.user:
            return
        
        # Only process #remora channel
        if message.channel.id != CHANNEL_ID:
            return
        
        # Check for URLs
        urls = extract_urls(message.content)
        if not urls:
            logger.debug(f"No URLs in message from {message.author}")
            return
        
        # Skip if already processed
        tracker = load_tracker()
        if message.id in tracker["processed_message_ids"]:
            logger.debug(f"Skipping already-processed message {message.id}")
            return
        
        logger.info(f"🔗 New link(s) from {message.author}: {message.content}")
        
        # Process each URL
        for url in urls:
            try:
                logger.info(f"Processing: {url}")
                link_type = detect_link_type(url)
                
                # Fetch content
                fetch_result = fetch_url_content(url)
                title = fetch_result["title"]
                
                # Analyze content if fetch was successful
                analysis_data = None
                logger.debug(f"  📊 Fetch status: {fetch_result['status']}")
                
                if fetch_result["status"] == "ok":
                    logger.debug(f"  🔍 Starting analysis...")
                    analysis_data = analyze_content(url, title, fetch_result.get("content", ""), link_type)
                    logger.debug(f"  Analysis result: {analysis_data}")
                else:
                    logger.debug(f"  ⚠️ Fetch failed, skipping analysis")
                
                # Prepare summary for Tududi
                summary_text = ""
                tag = "interesting"
                if analysis_data:
                    summary_text = analysis_data.get("summary", "")
                    tag = analysis_data.get("tag", "interesting")
                    logger.debug(f"  ✓ Got summary: {summary_text[:80]}")
                else:
                    logger.warning(f"  ❌ No analysis data returned")
                
                # Add to Tududi with summary
                tududi_ok = add_to_tududi(title, url, link_type, summary_text, tag)
                
                # Format response for Discord
                response_text = f"📌 **{link_type}**: {title}"
                if summary_text:
                    response_text += f"\n\n💡 {summary_text}"
                if tag:
                    response_text += f"\n\n🏷️ Tag: `{tag}`"
                
                logger.debug(f"Posting response: {response_text}")
                
                # Post in channel
                await message.reply(response_text, mention_author=False)
                
                # Update tracker
                tracker["links"].append({
                    "url": url,
                    "title": title,
                    "type": link_type,
                    "author": str(message.author),
                    "message_id": message.id,
                    "date": datetime.now().isoformat(),
                    "analysis": analysis_data,
                    "tududi": tududi_ok,
                    "fetch_status": fetch_result["status"]
                })
                
                logger.info(f"✓ Processed: {url}")
                
            except Exception as e:
                logger.error(f"❌ Error processing {url}: {e}")
                await message.reply(f"❌ Error analyzing link: {e}", mention_author=False)
        
        # Update processed IDs
        tracker["processed_message_ids"].append(message.id)
        save_tracker(tracker)
        logger.info(f"Updated tracker, total links: {len(tracker['links'])}")

# Main
if __name__ == "__main__":
    token = os.getenv("DISCORD_BOT_TOKEN")
    if not token:
        logger.error("❌ DISCORD_BOT_TOKEN not set!")
        exit(1)
    
    logger.info("Starting bot...")
    bot = LinkAnalyzerBot(intents=intents)
    bot.run(token)
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00			`#!/usr/bin/env python3`
			`"""`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`Discord bot for #remora channel - analyzes links in real-time with web_fetch + AI`
			`Posts summaries, adds to Tududi inbox, maintains JSON history + logs`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00			`"""`

			`import discord`
			`import os`
			`import json`
			`import re`
			`import requests`
			`from datetime import datetime`
			`from pathlib import Path`
			`from dotenv import load_dotenv`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`import logging`
			`from urllib.parse import urlparse`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00
			`# Load .env file`
			`load_dotenv()`

Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`# Setup logging`
			`log_file = Path(__file__).parent / "bot.log"`
			`logging.basicConfig(`
			`level=logging.DEBUG,`
			`format='[%(asctime)s] [%(levelname)-8s] %(message)s',`
			`handlers=[`
			`logging.FileHandler(log_file),`
			`logging.StreamHandler()`
			`]`
			`)`
			`logger = logging.getLogger(__name__)`

Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00			`# Config`
			`CHANNEL_ID = 1467557082583535729`
			`TRACKER_FILE = Path(__file__).parent / "tracker.json"`
			`TUDUDI_API_URL = os.getenv("TUDUDI_API_URL", "https://todo.dilain.com/api/v1")`
			`TUDUDI_API_KEY = os.getenv("TUDUDI_API_KEY")`
			`GATEWAY_URL = os.getenv("OPENCLAW_GATEWAY", "http://127.0.0.1:18789")`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`GATEWAY_TOKEN = os.getenv("OPENCLAW_GATEWAY_TOKEN", "")`

			`logger.info("=" * 60)`
			`logger.info("Bot startup")`
			`logger.info(f" Channel ID: {CHANNEL_ID}")`
			`logger.info(f" Tududi API: {TUDUDI_API_URL}")`
			`logger.info(f" Gateway: {GATEWAY_URL}")`
			`logger.info("=" * 60)`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00
			`# Load or init tracker`
			`def load_tracker():`
			`if TRACKER_FILE.exists():`
			`with open(TRACKER_FILE) as f:`
			`return json.load(f)`
			`return {`
			`"channel_id": CHANNEL_ID,`
			`"processed_message_ids": [],`
			`"links": []`
			`}`

			`def save_tracker(data):`
			`with open(TRACKER_FILE, "w") as f:`
			`json.dump(data, f, indent=2)`

			`# Detect links in text`
			`def extract_urls(text):`
			url_pattern = r'https?://[^\s<>"{}\|\\^`\[\]]+'
			`return re.findall(url_pattern, text)`

Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`# Detect link type`
			`def detect_link_type(url):`
			`domain = urlparse(url).netloc.lower()`

			`if "github.com" in domain:`
			`return "GitHub"`
			`elif "reddit.com" in domain:`
			`return "Reddit"`
			`elif "youtube.com" in domain or "youtu.be" in domain:`
			`return "YouTube"`
			`elif "tiktok.com" in domain:`
			`return "TikTok"`
			`elif "twitter.com" in domain or "x.com" in domain:`
			`return "Twitter/X"`
			`elif "medium.com" in domain:`
			`return "Medium"`
			`elif "dev.to" in domain:`
			`return "Dev.to"`
			`elif "arxiv.org" in domain:`
			`return "arXiv"`
			`else:`
			`return "Article"`

			`# Fetch URL content using requests`
			`def fetch_url_content(url):`
			`"""Fetch URL and return title + excerpt"""`
			`logger.debug(f" 📥 Fetching: {url}")`

Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00			`try:`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`response = requests.get(`
			`url,`
Improve: Better title extraction (og:title, h1), description parsing, disable gateway for now 2026-02-09 18:50:14 +01:00			`timeout=8,`
			`headers={`
			`'User-Agent': 'Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36',`
			`'Accept': 'text/html,application/xhtml+xml'`
			`},`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`allow_redirects=True`
			`)`
			`response.raise_for_status()`
Improve: Better title extraction (og:title, h1), description parsing, disable gateway for now 2026-02-09 18:50:14 +01:00			`content = response.text[:4000] # First 4k chars`

			`# Try multiple patterns for title`
			`title = None`

			`# Pattern 1: <title> tag`
			`title_match = re.search(r'<title[^>]>\s([^<]+?)\s*</title>', content, re.IGNORECASE)`
			`if title_match:`
			`title = title_match.group(1).strip()`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00
Improve: Better title extraction (og:title, h1), description parsing, disable gateway for now 2026-02-09 18:50:14 +01:00			`# Pattern 2: og:title meta tag (for GitHub, etc.)`
			`if not title:`
			`og_match = re.search(r'<meta\s+property="og:title"\s+content="([^"]+)"', content, re.IGNORECASE)`
			`if og_match:`
			`title = og_match.group(1).strip()`

			`# Pattern 3: h1 tag (for GitHub README)`
			`if not title:`
			`h1_match = re.search(r'<h1[^>]*>([^<]+)</h1>', content, re.IGNORECASE)`
			`if h1_match:`
			`title = h1_match.group(1).strip()`

			`# Fallback`
			`if not title:`
			`title = url.split('/')[-1] or "Untitled"`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`# Extract meta description`
			`desc_match = re.search(r'<meta\s+name="description"\s+content="([^"]+)"', content, re.IGNORECASE)`
			`description = desc_match.group(1) if desc_match else ""`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00
Improve: Better title extraction (og:title, h1), description parsing, disable gateway for now 2026-02-09 18:50:14 +01:00			`# Extract og:description`
			`if not description:`
			`og_desc = re.search(r'<meta\s+property="og:description"\s+content="([^"]+)"', content, re.IGNORECASE)`
			`if og_desc:`
			`description = og_desc.group(1)`

Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`logger.debug(f" ✓ Fetched: {title}")`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00			`return {`
			`"title": title,`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`"description": description,`
			`"content": content,`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00			`"status": "ok"`
			`}`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`except requests.Timeout:`
			`logger.warning(f" ⏱️ Timeout: {url}")`
			`return {"title": "Request timeout", "status": "timeout", "content": ""}`
			`except requests.HTTPError as e:`
			`logger.warning(f" ❌ HTTP {e.response.status_code}: {url}")`
			`return {"title": f"HTTP {e.response.status_code}", "status": "http_error", "content": ""}`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00			`except Exception as e:`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`logger.error(f" ❌ Error: {e}")`
			`return {"title": "Fetch failed", "status": "error", "error": str(e), "content": ""}`

Improve: Local heuristic-based analysis (no subprocess needed, fast) 2026-02-09 19:05:31 +01:00			`# Analyze content (local heuristic-based)`
Feature: AI-powered intelligent summaries with sub-agents (analyze + tag) 2026-02-09 18:56:26 +01:00			`def analyze_content(url, title, content, link_type):`
Improve: Local heuristic-based analysis (no subprocess needed, fast) 2026-02-09 19:05:31 +01:00			`"""Analyze content and suggest summary + tag locally"""`
Feature: AI-powered intelligent summaries with sub-agents (analyze + tag) 2026-02-09 18:56:26 +01:00			`logger.debug(f" 🤖 Analyzing content: {url}")`
Debug: Add detailed logging for analysis pipeline 2026-02-09 19:11:34 +01:00			`logger.debug(f" Content length: {len(content)} chars")`
			`logger.debug(f" Link type: {link_type}")`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00
			`try:`
Improve: Local heuristic-based analysis (no subprocess needed, fast) 2026-02-09 19:05:31 +01:00			`# Extract useful info from HTML content`
			`description = ""`

			`# Looking for meta description`
			`desc_match = re.search(r'<meta\s+name="description"\s+content="([^"]+)"', content, re.IGNORECASE)`
			`if desc_match:`
			`description = desc_match.group(1).strip()`
Debug: Add detailed logging for analysis pipeline 2026-02-09 19:11:34 +01:00			`logger.debug(f" Found meta description: {description[:80]}")`
Improve: Local heuristic-based analysis (no subprocess needed, fast) 2026-02-09 19:05:31 +01:00
			`# Looking for og:description`
			`if not description:`
			`og_desc = re.search(r'<meta\s+property="og:description"\s+content="([^"]+)"', content, re.IGNORECASE)`
			`if og_desc:`
			`description = og_desc.group(1).strip()`
Debug: Add detailed logging for analysis pipeline 2026-02-09 19:11:34 +01:00			`logger.debug(f" Found og:description: {description[:80]}")`
Improve: Local heuristic-based analysis (no subprocess needed, fast) 2026-02-09 19:05:31 +01:00
			`# Looking for first paragraph after title`
			`if not description:`
			`p_match = re.search(r'<p[^>]*>([^<]+)</p>', content, re.IGNORECASE)`
			`if p_match:`
			`description = p_match.group(1).strip()[:200]`

			`# Determine tag based on content + URL + type`
			`tag = "interesting"`
			`summary = ""`

			`if link_type == "GitHub":`
			`tag = "project"`
			`summary = f"GitHub repository: {title}"`
			`# Try to extract more info from README`
			`readme_match = re.search(r'README[^<]</h[1-3]>[^<]<p[^>]*>([^<]+)', content, re.IGNORECASE)`
			`if readme_match:`
			`summary += f". {readme_match.group(1)[:100]}"`

			`elif link_type == "YouTube":`
			`tag = "video"`
			`summary = f"Video: {title}"`
			`if description:`
			`summary += f". {description[:80]}"`

			`elif link_type == "Reddit":`
			`tag = "discussion"`
			`summary = f"Reddit discussion: {title}"`

			`elif link_type == "Medium" or link_type == "Dev.to":`
			`tag = "article"`
			`summary = f"Article: {title}"`
			`if description:`
			`summary += f". {description[:80]}"`

			`elif link_type == "arXiv":`
			`tag = "learning"`
			`summary = f"Research paper: {title}"`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00
			`else:`
Improve: Local heuristic-based analysis (no subprocess needed, fast) 2026-02-09 19:05:31 +01:00			`# Generic web article`
			`tag = "to-read"`
			`summary = title`
			`if description:`
			`summary += f". {description[:100]}"`

			`# Truncate summary to reasonable length`
			`summary = summary[:200]`

Debug: Add detailed logging for analysis pipeline 2026-02-09 19:11:34 +01:00			`logger.info(f" ✓ Analysis complete - Tag: {tag}, Summary: {summary[:60]}")`
Improve: Local heuristic-based analysis (no subprocess needed, fast) 2026-02-09 19:05:31 +01:00
Debug: Add detailed logging for analysis pipeline 2026-02-09 19:11:34 +01:00			`result = {`
Improve: Local heuristic-based analysis (no subprocess needed, fast) 2026-02-09 19:05:31 +01:00			`"summary": summary,`
			`"tag": tag,`
			`"relevance": "relevant"`
			`}`
Debug: Add detailed logging for analysis pipeline 2026-02-09 19:11:34 +01:00			`logger.debug(f" Returning: {result}")`
			`return result`
Feature: AI-powered intelligent summaries with sub-agents (analyze + tag) 2026-02-09 18:56:26 +01:00
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`except Exception as e:`
Improve: Local heuristic-based analysis (no subprocess needed, fast) 2026-02-09 19:05:31 +01:00			`logger.error(f" Analysis error: {e}")`
Debug: Add detailed logging for analysis pipeline 2026-02-09 19:11:34 +01:00			`import traceback`
			`logger.error(traceback.format_exc())`
Improve: Local heuristic-based analysis (no subprocess needed, fast) 2026-02-09 19:05:31 +01:00			`# Return minimal analysis`
			`return {`
			`"summary": title,`
			`"tag": "interesting",`
			`"relevance": "relevant"`
			`}`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00
			`# Send to Tududi inbox`
Feature: AI-powered intelligent summaries with sub-agents (analyze + tag) 2026-02-09 18:56:26 +01:00			`def add_to_tududi(title, url, link_type, summary="", tag=""):`
			`"""Add to Tududi inbox with intelligent summary"""`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`logger.debug(f" 📌 Adding to Tududi: {title}")`

Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00			`try:`
			`if not TUDUDI_API_KEY:`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`logger.warning(" TUDUDI_API_KEY not set")`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00			`return False`

Feature: AI-powered intelligent summaries with sub-agents (analyze + tag) 2026-02-09 18:56:26 +01:00			`# Format the inbox content`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`content = f"📌 {link_type}: {title}\n🔗 {url}"`
Feature: AI-powered intelligent summaries with sub-agents (analyze + tag) 2026-02-09 18:56:26 +01:00
			`if summary:`
			`content += f"\n\n💡 Summary:\n{summary}"`

			`if tag:`
			`content += f"\n\n🏷️ Tag: {tag}"`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00
			`response = requests.post(`
			`f"{TUDUDI_API_URL}/inbox",`
			`headers={`
			`"Authorization": f"Bearer {TUDUDI_API_KEY}",`
			`"Content-Type": "application/json"`
			`},`
			`json={"content": content},`
			`timeout=5`
			`)`

Feature: AI-powered intelligent summaries with sub-agents (analyze + tag) 2026-02-09 18:56:26 +01:00			`if response.status_code in [200, 201]: # 200 or 201 are both OK`
			`logger.info(f" ✓ Added to Tududi inbox with tag: {tag}")`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00			`return True`
			`else:`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`logger.warning(f" Tududi error: {response.status_code}")`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00			`return False`
			`except Exception as e:`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`logger.error(f" Tududi error: {e}")`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00			`return False`

			`# Discord bot`
			`intents = discord.Intents.default()`
			`intents.message_content = True`

			`class LinkAnalyzerBot(discord.Client):`
			`async def on_ready(self):`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`logger.info(f"✅ Bot logged in as {self.user}")`
			`logger.info(f"📍 Watching channel #remora ({CHANNEL_ID})")`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00
			`async def on_message(self, message):`
			`# Ignore bot's own messages`
			`if message.author == self.user:`
			`return`

			`# Only process #remora channel`
			`if message.channel.id != CHANNEL_ID:`
			`return`

			`# Check for URLs`
			`urls = extract_urls(message.content)`
			`if not urls:`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`logger.debug(f"No URLs in message from {message.author}")`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00			`return`

			`# Skip if already processed`
			`tracker = load_tracker()`
			`if message.id in tracker["processed_message_ids"]:`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`logger.debug(f"Skipping already-processed message {message.id}")`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00			`return`

Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`logger.info(f"🔗 New link(s) from {message.author}: {message.content}")`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00
			`# Process each URL`
			`for url in urls:`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`try:`
			`logger.info(f"Processing: {url}")`
			`link_type = detect_link_type(url)`

			`# Fetch content`
			`fetch_result = fetch_url_content(url)`
			`title = fetch_result["title"]`

Feature: AI-powered intelligent summaries with sub-agents (analyze + tag) 2026-02-09 18:56:26 +01:00			`# Analyze content if fetch was successful`
			`analysis_data = None`
Debug: Add detailed logging for analysis pipeline 2026-02-09 19:11:34 +01:00			`logger.debug(f" 📊 Fetch status: {fetch_result['status']}")`

Feature: AI-powered intelligent summaries with sub-agents (analyze + tag) 2026-02-09 18:56:26 +01:00			`if fetch_result["status"] == "ok":`
Debug: Add detailed logging for analysis pipeline 2026-02-09 19:11:34 +01:00			`logger.debug(f" 🔍 Starting analysis...")`
Feature: AI-powered intelligent summaries with sub-agents (analyze + tag) 2026-02-09 18:56:26 +01:00			`analysis_data = analyze_content(url, title, fetch_result.get("content", ""), link_type)`
Debug: Add detailed logging for analysis pipeline 2026-02-09 19:11:34 +01:00			`logger.debug(f" Analysis result: {analysis_data}")`
			`else:`
			`logger.debug(f" ⚠️ Fetch failed, skipping analysis")`
Feature: AI-powered intelligent summaries with sub-agents (analyze + tag) 2026-02-09 18:56:26 +01:00
			`# Prepare summary for Tududi`
			`summary_text = ""`
			`tag = "interesting"`
			`if analysis_data:`
			`summary_text = analysis_data.get("summary", "")`
			`tag = analysis_data.get("tag", "interesting")`
Debug: Add detailed logging for analysis pipeline 2026-02-09 19:11:34 +01:00			`logger.debug(f" ✓ Got summary: {summary_text[:80]}")`
			`else:`
			`logger.warning(f" ❌ No analysis data returned")`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00
Feature: AI-powered intelligent summaries with sub-agents (analyze + tag) 2026-02-09 18:56:26 +01:00			`# Add to Tududi with summary`
			`tududi_ok = add_to_tududi(title, url, link_type, summary_text, tag)`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00
			`# Format response for Discord`
			`response_text = f"📌 {link_type}: {title}"`
Feature: AI-powered intelligent summaries with sub-agents (analyze + tag) 2026-02-09 18:56:26 +01:00			`if summary_text:`
			`response_text += f"\n\n💡 {summary_text}"`
			`if tag:`
			response_text += f"\n\n🏷️ Tag: `{tag}`"
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00
			`logger.debug(f"Posting response: {response_text}")`

			`# Post in channel`
			`await message.reply(response_text, mention_author=False)`

			`# Update tracker`
			`tracker["links"].append({`
			`"url": url,`
			`"title": title,`
			`"type": link_type,`
			`"author": str(message.author),`
			`"message_id": message.id,`
			`"date": datetime.now().isoformat(),`
Fix: Variable name analysis_data instead of analysis 2026-02-09 18:59:09 +01:00			`"analysis": analysis_data,`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`"tududi": tududi_ok,`
			`"fetch_status": fetch_result["status"]`
			`})`

			`logger.info(f"✓ Processed: {url}")`

			`except Exception as e:`
			`logger.error(f"❌ Error processing {url}: {e}")`
			`await message.reply(f"❌ Error analyzing link: {e}", mention_author=False)`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00
			`# Update processed IDs`
			`tracker["processed_message_ids"].append(message.id)`
			`save_tracker(tracker)`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`logger.info(f"Updated tracker, total links: {len(tracker['links'])}")`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00
			`# Main`
			`if __name__ == "__main__":`
			`token = os.getenv("DISCORD_BOT_TOKEN")`
			`if not token:`
Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`logger.error("❌ DISCORD_BOT_TOKEN not set!")`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00			`exit(1)`

Feat: Add web_fetch, AI analysis (Haiku), and comprehensive logging 2026-02-09 18:46:45 +01:00			`logger.info("Starting bot...")`
Initial: Link analyzer bot for #remora channel 2026-02-09 18:07:14 +01:00			`bot = LinkAnalyzerBot(intents=intents)`
			`bot.run(token)`