Add files via upload

githubasr2001 · web-flow · commit 6681a89ec0d7 · 2024-10-02T23:53:52.000-05:00
diff --git a/app.py b/app.py
@@ -0,0 +1,39 @@
+from flask import Flask, render_template, request, jsonify
+import os
+import subprocess
+
+# Flask application object; the route handlers below are registered on it.
+app = Flask(__name__)
+
+@app.route('/')
+def index():
+    """Render the landing page (``index.html``)."""
+    return render_template('index.html')
+
+@app.route('/analyze', methods=['POST'])
+def analyze():
+    """Run the extraction and analysis pipeline for a submitted YouTube URL.
+
+    Reads ``youtube_url`` from the posted form, runs the frame extractor and
+    then each analysis script as a child process, and renders
+    ``results.html`` with the text each analysis wrote under ``results/``.
+
+    Returns:
+        The rendered results page; a 400 JSON error when the submitted value
+        is not an http(s) URL; a 500 JSON error when frame extraction fails.
+    """
+    import sys  # local import: only needed to locate the running interpreter
+
+    youtube_url = request.form['youtube_url'].strip()
+
+    # The value is forwarded as a command-line argument, so refuse anything
+    # that is not a plain http(s) URL (for example a string starting with
+    # '-' that a child process could interpret as an option).
+    if not youtube_url.startswith(('http://', 'https://')):
+        return jsonify(error='A valid http(s) YouTube URL is required.'), 400
+
+    # Use the interpreter running this app instead of whatever "python"
+    # resolves to on PATH.
+    python = sys.executable or 'python'
+
+    # Call the YouTube frame extractor script
+    extraction = subprocess.run([python, 'youtube_frame_extractor.py', youtube_url])
+    if extraction.returncode != 0:
+        # Without fresh frames the analyses would report on whatever a
+        # previous request left in the frames folder.
+        return jsonify(error='Frame extraction failed.'), 500
+
+    # Analysis script and the result file it writes, keyed by template name
+    analyses = {
+        'color_analysis': (
+            'color_analysis.py',
+            'results/color_analysis/color_analysis_results.txt',
+        ),
+        'face_detection': (
+            'face_detection.py',
+            'results/face_detection/face_detection_results.txt',
+        ),
+        'scene_change': (
+            'scene_change_detection.py',
+            'results/scene_change/scene_change_results.txt',
+        ),
+    }
+
+    # Run analysis scripts and prepare results
+    results = {}
+    for key, (script, result_path) in analyses.items():
+        # Drop the output of any previous request so a failed run cannot
+        # present stale data as the current result.
+        if os.path.exists(result_path):
+            os.remove(result_path)
+
+        completed = subprocess.run([python, script])
+        if completed.returncode != 0:
+            app.logger.error('%s exited with status %d', script, completed.returncode)
+
+        results[key] = get_file_content(result_path)
+
+    return render_template('results.html', results=results)
+
+def get_file_content(file_path):
+    """Return the text stored at ``file_path``, or a placeholder message.
+
+    Args:
+        file_path: Path of the result file to read.
+
+    Returns:
+        The file's full contents, or ``"Analysis results not available."``
+        when the file is missing or cannot be read.
+    """
+    # Open directly instead of checking os.path.exists first: the file can
+    # disappear between the check and the open, and a directory or an
+    # unreadable file would pass the check and then raise.
+    try:
+        with open(file_path, 'r') as file:
+            return file.read()
+    except OSError:
+        return "Analysis results not available."
+
+if __name__ == '__main__':
+    # The interactive debugger enabled by debug mode lets a client execute
+    # arbitrary code, so it is opt-in (FLASK_DEBUG=1) rather than always on.
+    app.run(debug=os.environ.get('FLASK_DEBUG') == '1')
diff --git a/color_analysis.py b/color_analysis.py
@@ -0,0 +1,41 @@
+import os
+import cv2
+from collections import Counter
+
+# Function to get the dominant color
+def get_dominant_color(frame):
+    """Return the most frequent pixel color of ``frame`` as an RGB tuple.
+
+    The frame is resized to 100x100 before counting, so at most 10,000
+    pixels are tallied regardless of the input resolution.
+
+    Args:
+        frame: Three-channel image array in OpenCV's BGR channel order, as
+            produced by ``cv2.imread``.
+
+    Returns:
+        A ``(red, green, blue)`` tuple of plain ``int`` values.
+    """
+    img = cv2.resize(frame, (100, 100))
+    # tolist() yields plain Python ints, which hash faster than NumPy
+    # scalars and print as bare numbers.
+    pixels = img.reshape(-1, 3).tolist()
+
+    color_count = Counter(map(tuple, pixels))
+    blue, green, red = color_count.most_common(1)[0][0]
+
+    # OpenCV stores channels as BGR, while the report written by
+    # analyze_frames labels this value "RGB", so reorder before returning.
+    return (red, green, blue)
+
+# Analyze frames and categorize by dominant color
+def analyze_frames():
+    """Group the extracted frames by dominant color and write a summary.
+
+    Reads every ``.jpg`` file in ``frames/``, determines its dominant color
+    with ``get_dominant_color`` and writes one line per distinct color (with
+    the number of frames sharing it) to
+    ``results/color_analysis/color_analysis_results.txt``.
+
+    Raises:
+        FileNotFoundError: If the ``frames`` folder does not exist.
+    """
+    frame_folder = 'frames'
+    result_dir = 'results/color_analysis'
+    os.makedirs(result_dir, exist_ok=True)  # Create results directory if it doesn't exist
+
+    color_categorized_frames = {}
+
+    # os.listdir order is arbitrary; sort so the report is reproducible.
+    for filename in sorted(os.listdir(frame_folder)):
+        if not filename.endswith('.jpg'):
+            continue
+
+        frame_path = os.path.join(frame_folder, filename)
+        frame = cv2.imread(frame_path)
+        if frame is None:
+            # cv2.imread returns None instead of raising when a file cannot
+            # be decoded; skip it rather than crash on the next call.
+            print(f"Skipping unreadable frame: {frame_path}")
+            continue
+
+        # Get dominant color
+        dominant_color = get_dominant_color(frame)
+        color_categorized_frames.setdefault(dominant_color, []).append(frame_path)
+
+    # Save results to a text file in the specific results folder
+    with open(os.path.join(result_dir, 'color_analysis_results.txt'), 'w') as f:
+        for color, frames in color_categorized_frames.items():
+            f.write(f"Color (RGB): {color}, Number of Frames: {len(frames)}\n")
+
+# Run the color analysis only when executed as a script, not on import.
+if __name__ == "__main__":
+    analyze_frames()
diff --git a/face_detection.py b/face_detection.py
@@ -0,0 +1,38 @@
+import os
+import cv2
+
+# Load the pre-trained Haar Cascade model for face detection.
+# Loaded once at import time and shared by every detect_faces call; the XML
+# file is looked up in the cascade directory that ships with OpenCV.
+face_cascade = cv2.CascadeClassifier(cv2.data.haarcascades + 'haarcascade_frontalface_default.xml')
+
+# Function to detect faces in a frame
+def detect_faces(frame):
+    """Report whether the Haar cascade finds at least one face in ``frame``.
+
+    Args:
+        frame: Image array that ``cv2.cvtColor`` can convert from BGR to
+            grayscale.
+
+    Returns:
+        ``True`` when one or more detections are returned, else ``False``.
+    """
+    grayscale = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
+    detections = face_cascade.detectMultiScale(
+        grayscale,
+        scaleFactor=1.1,
+        minNeighbors=5,
+    )
+    face_found = len(detections) > 0
+    return face_found
+
+# Analyze frames based on face detection
+def analyze_frames():
+    """Sort the extracted frames into with/without faces and write a summary.
+
+    Reads every ``.jpg`` file in ``frames/``, runs ``detect_faces`` on it and
+    writes the number of frames in each category to
+    ``results/face_detection/face_detection_results.txt``.
+
+    Raises:
+        FileNotFoundError: If the ``frames`` folder does not exist.
+    """
+    frame_folder = 'frames'
+    result_dir = 'results/face_detection'
+    os.makedirs(result_dir, exist_ok=True)  # Create results directory if it doesn't exist
+
+    face_categorized_frames = {'with_faces': [], 'without_faces': []}
+
+    # os.listdir order is arbitrary; sort so the lists are reproducible.
+    for filename in sorted(os.listdir(frame_folder)):
+        if not filename.endswith('.jpg'):
+            continue
+
+        frame_path = os.path.join(frame_folder, filename)
+        frame = cv2.imread(frame_path)
+        if frame is None:
+            # cv2.imread returns None instead of raising when a file cannot
+            # be decoded; skip it rather than crash inside detect_faces.
+            print(f"Skipping unreadable frame: {frame_path}")
+            continue
+
+        # Check for faces in the frame
+        category = 'with_faces' if detect_faces(frame) else 'without_faces'
+        face_categorized_frames[category].append(frame_path)
+
+    # Save results to a text file in the specific results folder
+    with open(os.path.join(result_dir, 'face_detection_results.txt'), 'w') as f:
+        for category, frames in face_categorized_frames.items():
+            f.write(f"Category: {category}, Number of Frames: {len(frames)}\n")
+
+# Run the face analysis only when executed as a script, not on import.
+if __name__ == "__main__":
+    analyze_frames()
diff --git a/readme.md b/readme.md
@@ -0,0 +1 @@
+# Youtube-Frame-Extraction
diff --git a/requirements.txt b/requirements.txt
@@ -0,0 +1,8 @@
+yt-dlp
+opencv-python
+selenium
+webdriver-manager
+flask
diff --git a/scene_change_detection.py b/scene_change_detection.py
@@ -0,0 +1,33 @@
+import cv2
+import os
+
+def scene_change_detection(frame_folder='frames',
+                           result_dir='results/scene_change',
+                           changed_pixel_threshold=10000,
+                           pixel_diff_threshold=0):
+    """Flag frames that differ strongly from the frame before them.
+
+    Walks the ``.jpg`` files of ``frame_folder`` in sorted name order,
+    compares each grayscale frame with the previous readable one and writes
+    one line per detected change to ``scene_change_results.txt`` inside
+    ``result_dir``.
+
+    Args:
+        frame_folder: Directory containing the extracted frames.
+        result_dir: Directory the result file is written to (created if
+            missing).
+        changed_pixel_threshold: A frame is reported when more than this
+            many pixels differ from the previous frame.
+        pixel_diff_threshold: Per-pixel absolute difference that must be
+            exceeded for a pixel to count as changed. The default of 0
+            counts every pixel that differs at all, which also counts JPEG
+            compression noise; raise it to make detection less sensitive.
+
+    Raises:
+        FileNotFoundError: If ``frame_folder`` does not exist.
+    """
+    os.makedirs(result_dir, exist_ok=True)
+
+    previous_frame = None
+    scene_changes = []
+
+    for filename in sorted(os.listdir(frame_folder)):
+        if not filename.endswith('.jpg'):
+            continue
+
+        frame_path = os.path.join(frame_folder, filename)
+        frame = cv2.imread(frame_path)
+        if frame is None:
+            # cv2.imread returns None instead of raising when a file cannot
+            # be decoded; skip it and keep comparing against the last good
+            # frame.
+            print(f"Skipping unreadable frame: {frame_path}")
+            continue
+        gray_frame = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
+
+        if previous_frame is not None:
+            if previous_frame.shape != gray_frame.shape:
+                # cv2.absdiff requires equally sized inputs. A change in
+                # resolution is reported as a scene change.
+                scene_changes.append(frame_path)
+            else:
+                diff = cv2.absdiff(previous_frame, gray_frame)
+                if pixel_diff_threshold > 0:
+                    # Keep only pixels whose difference exceeds the
+                    # per-pixel threshold before counting them.
+                    _, diff = cv2.threshold(
+                        diff, pixel_diff_threshold, 255, cv2.THRESH_BINARY
+                    )
+                non_zero_count = cv2.countNonZero(diff)
+
+                # Threshold for significant scene change
+                if non_zero_count > changed_pixel_threshold:
+                    scene_changes.append(frame_path)
+
+        previous_frame = gray_frame
+
+    with open(os.path.join(result_dir, 'scene_change_results.txt'), 'w') as f:
+        for scene in scene_changes:
+            f.write(f"Scene Change Detected: {scene}\n")
+
+# Run the scene-change analysis only when executed as a script, not on import.
+if __name__ == "__main__":
+    scene_change_detection()
diff --git a/templates/index.html b/templates/index.html
@@ -0,0 +1,52 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+    <meta charset="UTF-8">
+    <meta name="viewport" content="width=device-width, initial-scale=1.0">
+    <title>YouTube Video Analysis</title>
+    <style>
+        body {
+            font-family: Arial, sans-serif;
+            line-height: 1.6;
+            margin: 0;
+            padding: 20px;
+            background-color: #f4f4f4;
+        }
+        .container {
+            max-width: 800px;
+            margin: auto;
+            background: white;
+            padding: 20px;
+            border-radius: 5px;
+            box-shadow: 0 0 10px rgba(0,0,0,0.1);
+        }
+        h1 {
+            color: #333;
+        }
+        input[type="text"] {
+            width: 100%;
+            padding: 10px;
+            margin-bottom: 10px;
+        }
+        button {
+            background-color: #4CAF50;
+            color: white;
+            padding: 10px 15px;
+            border: none;
+            cursor: pointer;
+        }
+        button:hover {
+            background-color: #45a049;
+        }
+    </style>
+</head>
+<body>
+    <div class="container">
+        <h1>YouTube Video Analysis</h1>
+        <form action="{{ url_for('analyze') }}" method="post">
+            <input type="text" name="youtube_url" placeholder="Enter YouTube video URL" required>
+            <button type="submit">Start Analysis</button>
+        </form>
+    </div>
+</body>
+</html>
diff --git a/templates/results.html b/templates/results.html
@@ -0,0 +1,60 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+    <meta charset="UTF-8">
+    <meta name="viewport" content="width=device-width, initial-scale=1.0">
+    <title>Analysis Results</title>
+    <style>
+        body {
+            font-family: Arial, sans-serif;
+            line-height: 1.6;
+            margin: 0;
+            padding: 20px;
+            background-color: #f4f4f4;
+        }
+        .container {
+            max-width: 800px;
+            margin: auto;
+            background: white;
+            padding: 20px;
+            border-radius: 5px;
+            box-shadow: 0 0 10px rgba(0,0,0,0.1);
+        }
+        h1, h2 {
+            color: #333;
+        }
+        .result-section {
+            background-color: #e9e9e9;
+            padding: 10px;
+            margin-bottom: 20px;
+            border-radius: 3px;
+        }
+        pre {
+            white-space: pre-wrap;
+            word-wrap: break-word;
+        }
+    </style>
+</head>
+<body>
+    <div class="container">
+        <h1>Analysis Results</h1>
+        
+        <div class="result-section">
+            <h2>Color Analysis</h2>
+            <pre>{{ results.color_analysis }}</pre>
+        </div>
+        
+        <div class="result-section">
+            <h2>Face Detection</h2>
+            <pre>{{ results.face_detection }}</pre>
+        </div>
+        
+        <div class="result-section">
+            <h2>Scene Change Detection</h2>
+            <pre>{{ results.scene_change }}</pre>
+        </div>
+        
+        <a href="{{ url_for('index') }}">Analyze Another Video</a>
+    </div>
+</body>
+</html>
diff --git a/youtube_frame_extractor.py b/youtube_frame_extractor.py
@@ -0,0 +1,97 @@
+import os
+import cv2
+import time
+import yt_dlp as youtube_dl
+from selenium import webdriver
+from selenium.webdriver.chrome.service import Service
+from selenium.webdriver.common.by import By
+from selenium.webdriver.chrome.options import Options
+from webdriver_manager.chrome import ChromeDriverManager
+
+# Function to set up Selenium and handle ads on YouTube
+def setup_selenium_and_skip_ads(youtube_url):
+    """Open ``youtube_url`` in headless Chrome and try to skip a pre-roll ad.
+
+    Args:
+        youtube_url: Address of the video page to open.
+
+    Returns:
+        The browser's current URL after the page has loaded and the skip
+        attempt has been made.
+    """
+    # Local import keeps this block self-contained; selenium is already a
+    # dependency of this module.
+    from selenium.common.exceptions import WebDriverException
+
+    # Configure Selenium options (headless for background operation)
+    chrome_options = Options()
+    chrome_options.add_argument("--headless")
+    chrome_options.add_argument("--disable-gpu")
+    chrome_options.add_argument("--no-sandbox")
+    chrome_options.add_argument("--disable-dev-shm-usage")
+
+    # Set up Selenium WebDriver (automatically downloads the correct ChromeDriver)
+    driver = webdriver.Chrome(service=Service(ChromeDriverManager().install()), options=chrome_options)
+
+    # try/finally guarantees the browser process is shut down even when
+    # loading the page or reading the URL raises.
+    try:
+        # Open YouTube URL
+        driver.get(youtube_url)
+
+        # Wait for ads (you can adjust this wait time depending on the network speed)
+        time.sleep(10)
+
+        # Check if there is a "Skip Ad" button. find_element raises when the
+        # button is absent and click raises when it cannot be interacted
+        # with; both are WebDriverException subclasses.
+        try:
+            driver.find_element(By.CLASS_NAME, "ytp-ad-skip-button").click()
+        except WebDriverException:
+            print("No skippable ad found or already skipped")
+        else:
+            print("Ad skipped")
+
+        # Get the current URL after ads (if redirected)
+        return driver.current_url
+    finally:
+        # Close the browser after handling the ad
+        driver.quit()
+
+# Function to download the video using yt-dlp
+def download_youtube_video(youtube_url):
+    """Download ``youtube_url`` with yt-dlp and save it as ``video.mp4``.
+
+    Args:
+        youtube_url: Address of the video to download.
+    """
+    ydl_opts = {
+        'format': 'best',  # Get the best quality video
+        'outtmpl': 'video.mp4',  # Name of the downloaded video
+        # The output name is fixed, so without this yt-dlp treats an existing
+        # video.mp4 from an earlier run as "already downloaded" and the old
+        # video would be analyzed again.
+        'overwrites': True,
+    }
+    with youtube_dl.YoutubeDL(ydl_opts) as ydl:
+        ydl.download([youtube_url])
+
+# Function to extract frames using OpenCV
+def extract_frames(video_path, output_folder, frame_interval=1):
+    """Save frames of a video as numbered JPEG files.
+
+    Frames are written to ``output_folder`` as ``frame_00000.jpg``,
+    ``frame_00001.jpg`` and so on. ``frame_*.jpg`` files already present in
+    the folder are removed first so the folder only ever holds frames of the
+    video just processed.
+
+    Args:
+        video_path: Path of the video file to read.
+        output_folder: Directory to write the frames to (created if
+            missing).
+        frame_interval: Keep every N-th frame. The default of 1 keeps every
+            frame.
+
+    Raises:
+        ValueError: If ``frame_interval`` is smaller than 1.
+        OSError: If the video cannot be opened.
+    """
+    if frame_interval < 1:
+        raise ValueError("frame_interval must be at least 1")
+
+    cap = cv2.VideoCapture(video_path)
+    try:
+        # VideoCapture does not raise for a missing or unreadable file; it
+        # just reports that it is not opened.
+        if not cap.isOpened():
+            raise OSError(f"Could not open video: {video_path}")
+
+        os.makedirs(output_folder, exist_ok=True)
+
+        # Clear frames left by a previous extraction; otherwise a shorter
+        # video would leave the tail of the older one in the folder.
+        for stale in os.listdir(output_folder):
+            if stale.startswith("frame_") and stale.endswith(".jpg"):
+                os.remove(os.path.join(output_folder, stale))
+
+        frame_index = 0  # position in the source video
+        frame_count = 0  # number of frames written
+
+        while True:
+            ret, frame = cap.read()
+            if not ret:
+                break
+
+            if frame_index % frame_interval == 0:
+                # Save the frame as an image
+                frame_path = os.path.join(output_folder, f"frame_{frame_count:05d}.jpg")
+                cv2.imwrite(frame_path, frame)
+                frame_count += 1
+
+            frame_index += 1
+    finally:
+        cap.release()
+
+    print(f"Extracted {frame_count} frames.")
+
+# Main flow
+def main(youtube_url):
+    """Run the pipeline: handle ads, download the video, extract frames.
+
+    Args:
+        youtube_url: Address of the YouTube video to process.
+    """
+    video_file = 'video.mp4'
+    frames_dir = 'frames'
+
+    print("Processing YouTube video...")
+
+    # Step 1: let the browser session deal with ads and report the final URL
+    final_url = setup_selenium_and_skip_ads(youtube_url)
+
+    # Step 2: fetch the video with yt-dlp
+    print(f"Downloading video from: {final_url}")
+    download_youtube_video(final_url)
+
+    # Step 3: split the downloaded file into frame images
+    print("Extracting frames from video...")
+    extract_frames(video_file, frames_dir)
+
+    print("Process completed.")
+
+# Script entry point
+if __name__ == "__main__":
+    import sys
+
+    # Use the URL given as the first command-line argument; fall back to the
+    # sample video only when the script is run without one.
+    default_url = "https://www.youtube.com/watch?v=7Y5q41D8_hs"
+    youtube_video_url = sys.argv[1] if len(sys.argv) > 1 else default_url
+    main(youtube_video_url)