feat: Initial commit - Content Extractor for YouTube, Instagram, and blogs

- YouTube extraction with transcript support - Instagram reel extraction via browser automation - Blog/article web scraping - Auto-save to Obsidian vaults - Smart key point generation - Configurable via .env file - Quick extract shell script Tech stack: Python, requests, beautifulsoup4, playwright, youtube-transcript-api
2026-03-05 13:02:58 +05:30
commit c997e764b5
12 changed files with 1302 additions and 0 deletions
--- a/extract.sh
+++ b/extract.sh
@@ -0,0 +1,25 @@
+#!/bin/bash
+# Content Extractor - Quick extraction script
+# Usage: ./extract.sh <url> [folder]
+
+if [ -z "$1" ]; then
+    echo "Usage: $0 <url> [folder]"
+    echo ""
+    echo "Examples:"
+    echo "  $0 https://youtube.com/watch?v=abc123"
+    echo "  $0 https://instagram.com/reel/xyz789 Learning"
+    echo "  $0 https://medium.com/article Articles"
+    exit 1
+fi
+
+URL="$1"
+FOLDER="${2:-Content Extractor}"
+
+echo "🔥 Content Extractor"
+echo "===================="
+echo "URL: $URL"
+echo "Folder: $FOLDER"
+echo ""
+
+cd "$(dirname "$0")"
+python main.py "$URL" --folder "$FOLDER"