Files
xtream2m3u/run.py
ovosimpatico d02db1c8e6
Some checks failed
Build and Push Docker Image / build-and-push (push) Failing after 10s
Several performance improvements
2025-08-30 01:38:54 -03:00

727 lines
28 KiB
Python

import fnmatch
import ipaddress
import json
import logging
import os
import re
import socket
import time
import urllib.parse
from concurrent.futures import ThreadPoolExecutor, as_completed
from functools import lru_cache
import dns.resolver
import requests
from fake_useragent import UserAgent
from flask import Flask, Response, request, send_from_directory
# Configure logging: the root logger is set to WARNING, so the logger.info()
# and logger.debug() calls in this module produce no output unless the level
# is lowered.
logging.basicConfig(level=logging.WARNING)
logger = logging.getLogger(__name__)
# Flask application object; the @app.route decorators below register on it.
app = Flask(__name__)
@app.route("/")
def serve_frontend():
    """Return the frontend entry page (``index.html`` in ``frontend``) for the site root."""
    frontend_dir, entry_page = "frontend", "index.html"
    return send_from_directory(frontend_dir, entry_page)
@app.route("/assets/<path:filename>")
def serve_assets(filename):
    """Serve a file from the ``docs/assets`` directory.

    Args:
        filename: Path below ``/assets/`` taken from the request URL.

    Returns:
        The file response, or a plain-text 404 when the file cannot be served.
    """
    try:
        return send_from_directory("docs/assets", filename)
    except Exception as exc:
        # Catch Exception rather than using a bare ``except`` so SystemExit and
        # KeyboardInterrupt still propagate; every ordinary failure keeps
        # mapping to a 404, as before.
        logger.debug(f"Asset lookup failed for {filename}: {exc}")
        return "Asset not found", 404
@app.route("/<path:filename>")
def serve_static_files(filename):
    """Serve a static file from the ``frontend`` directory.

    Paths whose first segment is one of the API route names are rejected so
    this catch-all route never answers on their behalf.

    Args:
        filename: Request path (without the leading slash).

    Returns:
        The file response, or a plain-text 404.
    """
    # Don't serve API routes through static file handler
    api_routes = ("m3u", "xmltv", "categories", "image-proxy", "stream-proxy", "assets")
    first_segment = filename.split("/")[0]
    if first_segment in api_routes:
        return "Not found", 404

    # Only serve files that exist in the frontend directory
    try:
        return send_from_directory("frontend", filename)
    except Exception as exc:
        # Catch Exception rather than using a bare ``except`` so SystemExit and
        # KeyboardInterrupt still propagate; any ordinary failure is still
        # reported to the client as a 404.
        logger.debug(f"Static file lookup failed for {filename}: {exc}")
        return "File not found", 404
# Default proxy base URL, read once at import time from the PROXY_URL
# environment variable; None when the variable is not set.
DEFAULT_PROXY_URL = os.environ.get("PROXY_URL")
# Set up custom DNS resolver
def setup_custom_dns():
    """Route hostname lookups through a fixed list of public DNS servers.

    Replaces ``socket.getaddrinfo`` for the whole process with a wrapper that
    resolves hostnames through a ``dns.resolver.Resolver`` and passes the first
    answer to the original ``getaddrinfo``. IP literals are passed through
    unchanged, and any resolver failure falls back to the original lookup with
    the untouched hostname.
    """
    dns_servers = ["1.1.1.1", "1.0.0.1", "8.8.8.8", "8.8.4.4", "9.9.9.9"]
    custom_resolver = dns.resolver.Resolver()
    custom_resolver.nameservers = dns_servers
    original_getaddrinfo = socket.getaddrinfo

    # Parameter names (including ``type``) mirror socket.getaddrinfo so callers
    # that pass them by keyword keep working.
    def new_getaddrinfo(host, port, family=0, type=0, proto=0, flags=0):
        if host:
            try:
                # Skip DNS resolution for IP addresses
                try:
                    ipaddress.ip_address(host)
                    # If we get here, the host is already an IP address
                    logger.debug(f"Host is already an IP address: {host}, skipping DNS resolution")
                except ValueError:
                    # Not an IP address, so use DNS resolution
                    answers = custom_resolver.resolve(host)
                    resolved = str(answers[0])
                    # Log before rebinding ``host`` so the message shows the
                    # name that was looked up, not only the resulting address.
                    logger.debug(f"Custom DNS resolved {host} -> {resolved}")
                    host = resolved
            except Exception as e:
                logger.info(f"Custom DNS resolution failed for {host}: {e}, falling back to system DNS")
        return original_getaddrinfo(host, port, family, type, proto, flags)

    socket.getaddrinfo = new_getaddrinfo
    logger.info("Custom DNS resolver set up")
# Install the custom resolver before any outbound request is made
setup_custom_dns()

# Shared session so API calls reuse pooled connections. Each scheme gets its
# own adapter instance built from the same pool and retry settings.
_POOL_SETTINGS = {"pool_connections": 10, "pool_maxsize": 20, "max_retries": 3}
session = requests.Session()
session.mount('http://', requests.adapters.HTTPAdapter(**_POOL_SETTINGS))
session.mount('https://', requests.adapters.HTTPAdapter(**_POOL_SETTINGS))
# Common request function with caching for API endpoints
@lru_cache(maxsize=128)
def _fetch_api_data_cached(url, timeout):
    """Fetch *url* and return its decoded body; raise on any request failure.

    Only successful results are memoized, because ``lru_cache`` does not store
    calls that raise. Returns the parsed JSON value when the body is valid
    JSON, otherwise the body as text.
    """
    ua = UserAgent()
    headers = {
        "User-Agent": ua.chrome,
        "Accept": "application/json,text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8",
        "Accept-Language": "en-US,en;q=0.5",
        "Connection": "keep-alive",
        "Accept-Encoding": "gzip, deflate",
    }
    # ``hostname`` drops any port and user-info, so credentials embedded in the
    # authority part never reach the log.
    hostname = urllib.parse.urlparse(url).hostname
    logger.info(f"Making request to host: {hostname}")

    # The context manager releases the pooled connection even when
    # raise_for_status() fails before the streamed body has been read.
    with session.get(url, headers=headers, timeout=timeout, stream=True) as response:
        response.raise_for_status()

        content_length = response.headers.get('Content-Length')
        # isdigit() guards int() against a malformed header value.
        if content_length and content_length.isdigit() and int(content_length) > 10_000_000:  # > 10MB
            logger.info(f"Large response detected ({content_length} bytes), using optimized parsing")

        response.encoding = 'utf-8'  # Ensure proper encoding
        try:
            return response.json()
        except ValueError:
            # Every JSON decode error requests can raise (stdlib json,
            # simplejson, or requests' own JSONDecodeError) derives from
            # ValueError; catching only json.JSONDecodeError could miss some.
            # Fallback to text for non-JSON responses
            return response.text


def fetch_api_data(url, timeout=10):
    """Make a request to an API endpoint with caching.

    Successful responses are memoized per ``(url, timeout)`` for the lifetime
    of the process. Failures are not cached, so a transient network error does
    not permanently poison a URL.

    NOTE(review): cached entries never expire; confirm that serving stale
    provider data until restart/eviction is acceptable.

    Args:
        url: Absolute URL to fetch.
        timeout: Timeout in seconds passed to the HTTP request.

    Returns:
        The parsed JSON value, or the response text when the body is not
        JSON. On a request failure, an ``(error_dict, 503)`` tuple.
    """
    try:
        return _fetch_api_data_cached(url, timeout)
    except requests.exceptions.SSLError:
        return {"error": "SSL Error", "details": "Failed to verify SSL certificate"}, 503
    except requests.exceptions.RequestException as e:
        logger.error(f"RequestException: {e}")
        return {"error": "Request Exception", "details": str(e)}, 503


# Keep the lru_cache helpers reachable under the public name.
fetch_api_data.cache_clear = _fetch_api_data_cached.cache_clear
fetch_api_data.cache_info = _fetch_api_data_cached.cache_info
def stream_request(url, headers=None, timeout=10):
    """Open a streaming GET to *url* so the body is not buffered up front.

    When *headers* is missing or empty, a desktop Chrome User-Agent header is
    sent instead.
    """
    fallback_headers = {
        "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
    }
    effective_headers = headers if headers else fallback_headers
    return requests.get(url, stream=True, headers=effective_headers, timeout=timeout)
def encode_url(url):
    """Percent-encode every reserved character of *url*; falsy input gives ``""``."""
    if not url:
        return ""
    return urllib.parse.quote(url, safe="")
def generate_streaming_response(response, content_type=None):
    """Relay an upstream streaming response to the client chunk by chunk.

    Args:
        response: Upstream response object exposing ``headers``,
            ``iter_content`` and ``close`` (as returned by a streaming
            ``requests`` call).
        content_type: Content type to send; defaults to the upstream
            ``Content-Type`` header, or ``application/octet-stream``.

    Returns:
        A Flask ``Response`` whose body is produced lazily from the upstream
        stream. The upstream response is closed once the body is exhausted,
        fails, or the client goes away.
    """
    if not content_type:
        content_type = response.headers.get("Content-Type", "application/octet-stream")

    def generate():
        bytes_sent = 0
        try:
            for chunk in response.iter_content(chunk_size=8192):
                if chunk:
                    bytes_sent += len(chunk)
                    yield chunk
            logger.info(f"Stream completed, sent {bytes_sent} bytes")
        except Exception as e:
            logger.error(f"Streaming error: {str(e)}")
            raise
        finally:
            # Runs on normal completion, on error, and when the generator is
            # closed early, so the upstream connection is always released.
            response.close()

    headers = {
        "Access-Control-Allow-Origin": "*",
        "Content-Type": content_type,
    }

    upstream_headers = response.headers
    # Forward the upstream length only when it describes the bytes actually
    # relayed: iter_content() transparently decodes gzip/deflate bodies, so a
    # Content-Length paired with Content-Encoding would be wrong.
    if (
        "Content-Length" in upstream_headers
        and "Transfer-Encoding" not in upstream_headers
        and "Content-Encoding" not in upstream_headers
    ):
        headers["Content-Length"] = upstream_headers["Content-Length"]
    # No explicit "Transfer-Encoding: chunked" otherwise: it is a hop-by-hop
    # header that WSGI applications must not set (PEP 3333). The server picks
    # the framing itself when no length is given.

    return Response(generate(), mimetype=content_type, headers=headers, direct_passthrough=True)
@app.route("/image-proxy/<path:image_url>")
def proxy_image(image_url):
    """Proxy endpoint for images to avoid CORS issues.

    NOTE(review): the target URL comes straight from the request path, so this
    endpoint will fetch any address the server can reach (SSRF exposure).
    Consider an allow-list or blocking private address ranges.

    Args:
        image_url: Percent-encoded URL of the image to fetch.

    Returns:
        A streamed image response; 415 when the upstream content is not an
        image, 504 on timeout, the upstream status on HTTP errors, and 500 on
        anything else.
    """
    try:
        original_url = urllib.parse.unquote(image_url)
        logger.info(f"Image proxy request for: {original_url}")

        response = requests.get(original_url, stream=True, timeout=10)
        handed_off = False
        try:
            response.raise_for_status()

            content_type = response.headers.get("Content-Type", "")
            # Media types are case-insensitive, so compare in lower case.
            if not content_type.lower().startswith("image/"):
                logger.error(f"Invalid content type for image: {content_type}")
                return Response("Invalid image type", status=415)

            streaming_response = generate_streaming_response(response, content_type)
            handed_off = True
            return streaming_response
        finally:
            # With stream=True the connection stays open until the body is
            # read or the response is closed; release it on every path where
            # the body is not handed to the streaming generator.
            if not handed_off:
                response.close()
    except requests.Timeout:
        return Response("Image fetch timeout", status=504)
    except requests.HTTPError as e:
        return Response(f"Failed to fetch image: {str(e)}", status=e.response.status_code)
    except Exception as e:
        logger.error(f"Image proxy error: {str(e)}")
        return Response("Failed to process image", status=500)
@app.route("/stream-proxy/<path:stream_url>")
def proxy_stream(stream_url):
    """Proxy endpoint for streams.

    NOTE(review): like the image proxy, this fetches whatever URL the caller
    supplies (SSRF exposure); consider restricting the allowed targets.

    Args:
        stream_url: Percent-encoded URL of the stream to relay.

    Returns:
        A streamed response carrying the upstream body; 504 on timeout, the
        upstream status on HTTP errors, and 500 on anything else.
    """
    try:
        original_url = urllib.parse.unquote(stream_url)
        logger.info(f"Stream proxy request for: {original_url}")

        response = stream_request(original_url)
        handed_off = False
        try:
            response.raise_for_status()

            # Determine content type
            content_type = response.headers.get("Content-Type")
            if not content_type:
                # Look at the URL path only, so a query string such as
                # "?token=..." does not hide the file extension.
                url_path = urllib.parse.urlsplit(original_url).path.lower()
                if url_path.endswith(".ts"):
                    content_type = "video/MP2T"
                elif url_path.endswith(".m3u8"):
                    content_type = "application/vnd.apple.mpegurl"
                else:
                    content_type = "application/octet-stream"

            logger.info(f"Using content type: {content_type}")
            streaming_response = generate_streaming_response(response, content_type)
            handed_off = True
            return streaming_response
        finally:
            # Release the upstream connection whenever the body is not handed
            # to the streaming generator (for example on an HTTP error).
            if not handed_off:
                response.close()
    except requests.Timeout:
        return Response("Stream timeout", status=504)
    except requests.HTTPError as e:
        return Response(f"Failed to fetch stream: {str(e)}", status=e.response.status_code)
    except Exception as e:
        logger.error(f"Stream proxy error: {str(e)}")
        return Response("Failed to process stream", status=500)
def parse_group_list(group_string):
    """Parse a comma-separated string into a list of trimmed, non-empty names.

    Empty entries (from a trailing comma, a doubled comma, or whitespace-only
    items) are dropped: an empty pattern is a substring of every group title
    and would otherwise match everything.

    Args:
        group_string: Comma-separated group names; may be empty or None.

    Returns:
        The list of names in their original order; ``[]`` for empty input.
    """
    if not group_string:
        return []
    trimmed = (part.strip() for part in group_string.split(","))
    return [name for name in trimmed if name]
def group_matches(group_title, pattern):
    """Case-insensitively test whether *group_title* matches *pattern*.

    A pattern without spaces is an fnmatch pattern over the whole title when
    it contains ``*`` or ``?``, and a substring test otherwise. A pattern with
    spaces is split into words that are compared position by position with the
    title's leading words, each word using the same wildcard/substring rule.
    """
    def has_wildcard(text):
        return "*" in text or "?" in text

    title = group_title.lower()
    wanted = pattern.lower()

    # Single-token patterns are matched against the whole title
    if " " not in wanted:
        if has_wildcard(wanted):
            return fnmatch.fnmatch(title, wanted)
        return wanted in title

    wanted_words = wanted.split()
    title_words = title.split()

    # A pattern with more words than the title can never match
    if len(wanted_words) > len(title_words):
        return False

    # zip() pairs each pattern word with the title word at the same position
    return all(
        fnmatch.fnmatch(word, token) if has_wildcard(token) else token in word
        for token, word in zip(wanted_words, title_words)
    )
def get_required_params():
    """Get and validate the required parameters from the request.

    Reads ``url``, ``username`` and ``password`` from the query string. The
    proxy base URL comes from ``proxy_url``, then ``DEFAULT_PROXY_URL``, then
    the request's own host URL.

    Returns:
        A 5-tuple ``(url, username, password, proxy_url, error)``. On success
        ``error`` is None. When a required parameter is missing, the first
        four items are None and ``error`` is a ``(body, status, headers)``
        tuple that a view can return as-is.
    """
    url = request.args.get("url")
    username = request.args.get("username")
    password = request.args.get("password")

    if not url or not username or not password:
        body = json.dumps(
            {"error": "Missing Parameters", "details": "Required parameters: url, username, and password"}
        )
        # Callers do ``if error: return error``, so the fifth slot must be a
        # complete response. A bare 400 there is not a valid Flask return
        # value and would surface as a 500.
        return None, None, None, None, (body, 400, {"Content-Type": "application/json"})

    proxy_url = request.args.get("proxy_url", DEFAULT_PROXY_URL) or request.host_url.rstrip("/")
    return url, username, password, proxy_url, None
def validate_xtream_credentials(url, username, password):
    """Validate the Xtream API credentials.

    Args:
        url: Base URL of the Xtream server.
        username: Account user name.
        password: Account password.

    Returns:
        ``(data, None, None)`` when the server answers with a payload holding
        both ``user_info`` and ``server_info``; otherwise
        ``(None, error_json, status_code)`` where ``error_json`` is a JSON
        string.
    """
    # Encode the credentials so characters such as "&", "#" or spaces cannot
    # break or truncate the query string.
    query = urllib.parse.urlencode({"username": username, "password": password})
    api_url = f"{url.rstrip('/')}/player_api.php?{query}"
    data = fetch_api_data(api_url)

    if isinstance(data, tuple):  # Error response
        # Serialize so both error paths hand the caller a JSON string.
        return None, json.dumps(data[0]), data[1]

    # The payload may be text, a list or another JSON value; only a dict can
    # carry the two required sections.
    if not isinstance(data, dict) or "user_info" not in data or "server_info" not in data:
        return (
            None,
            json.dumps(
                {
                    "error": "Invalid Response",
                    "details": "Server response missing required data (user_info or server_info)",
                }
            ),
            400,
        )

    return data, None, None
def fetch_api_endpoint(url_info):
    """Fetch one ``(url, name, timeout)`` endpoint; used as the worker for concurrent requests.

    Returns ``(name, data)``, with ``data`` set to None when fetching raised.
    """
    endpoint_url, label, request_timeout = url_info
    try:
        logger.info(f"🚀 Fetching {label}...")
        started = time.time()
        payload = fetch_api_data(endpoint_url, timeout=request_timeout)
        elapsed = time.time() - started

        # Item counts are only reported for list payloads
        summary = f"✅ Completed {label} in {elapsed:.1f}s"
        if isinstance(payload, list):
            summary += f" - got {len(payload)} items"
        logger.info(summary)
        return label, payload
    except Exception as e:
        logger.warning(f"❌ Failed to fetch {label}: {e}")
        return label, None
def _tag_content_type(items, content_type, progress_label=None, batch_size=5000):
    """Set ``content_type`` on every dict in *items* in place, logging progress every *batch_size* items."""
    total = len(items)
    for count, item in enumerate(items, start=1):
        item["content_type"] = content_type
        # Same checkpoints as a per-batch log, without copying slices.
        if progress_label and count % batch_size == 0 and count < total:
            logger.info(f" Processed {count}/{total} {progress_label}...")


def fetch_categories_and_channels(url, username, password, include_vod=False):
    """Fetch categories and channels from the Xtream API using concurrent requests.

    Live categories and live streams are always fetched. With *include_vod*,
    VOD and series categories are fetched too; the VOD and series stream lists
    are only fetched when the current request endpoint is ``generate_m3u``.
    Every returned item gets a ``content_type`` key (``live``, ``vod`` or
    ``series``).

    Args:
        url: Base URL of the Xtream server.
        username: Account user name.
        password: Account password.
        include_vod: Whether to include VOD and series content.

    Returns:
        ``(categories, streams, None, None)`` on success, otherwise
        ``(None, None, error, status_code)``. ``error`` is the error dict
        reported by the fetch layer or a JSON string built here.
    """
    all_categories = []
    all_streams = []

    try:
        # Encode the credentials so characters such as "&" or "#" cannot
        # corrupt the query string.
        credentials = urllib.parse.urlencode({"username": username, "password": password})
        api_base = f"{url.rstrip('/')}/player_api.php?{credentials}"

        # Prepare all API endpoints to fetch concurrently: (url, name, timeout)
        api_endpoints = [
            (f"{api_base}&action=get_live_categories", "live_categories", 60),
            (f"{api_base}&action=get_live_streams", "live_streams", 180),
        ]

        # Add VOD endpoints if requested (WARNING: This will be much slower!)
        if include_vod:
            logger.warning("⚠️ Including VOD content - this will take significantly longer!")
            logger.info("💡 For faster loading, use the API without include_vod=true")
            api_endpoints.extend([
                (f"{api_base}&action=get_vod_categories", "vod_categories", 60),
                (f"{api_base}&action=get_series_categories", "series_categories", 60),
            ])

            # Only fetch the massive stream lists if explicitly needed for M3U generation
            vod_for_m3u = request.endpoint == 'generate_m3u'
            if vod_for_m3u:
                logger.warning("🐌 Fetching massive VOD/Series streams for M3U generation...")
                api_endpoints.extend([
                    (f"{api_base}&action=get_vod_streams", "vod_streams", 240),
                    (f"{api_base}&action=get_series", "series", 240),
                ])
            else:
                logger.info("⚡ Skipping massive VOD streams for categories-only request")

        # Fetch all endpoints concurrently using ThreadPoolExecutor
        logger.info(f"Starting concurrent fetch of {len(api_endpoints)} API endpoints...")
        results = {}
        with ThreadPoolExecutor(max_workers=10) as executor:
            future_to_name = {
                executor.submit(fetch_api_endpoint, endpoint): endpoint[1]
                for endpoint in api_endpoints
            }
            # Collect results as they complete
            for future in as_completed(future_to_name):
                name, data = future.result()
                results[name] = data
        logger.info("All concurrent API calls completed!")

        # Process live categories and streams (required)
        live_categories = results.get("live_categories")
        live_streams = results.get("live_streams")

        if isinstance(live_categories, tuple):  # Error response
            return None, None, live_categories[0], live_categories[1]
        if isinstance(live_streams, tuple):  # Error response
            return None, None, live_streams[0], live_streams[1]

        if not isinstance(live_categories, list) or not isinstance(live_streams, list):
            return (
                None,
                None,
                json.dumps(
                    {
                        "error": "Invalid Data Format",
                        "details": "Live categories or streams data is not in the expected format",
                    }
                ),
                500,
            )

        logger.info("Processing live content...")
        _tag_content_type(live_categories, "live")
        all_categories.extend(live_categories)
        _tag_content_type(live_streams, "live")
        all_streams.extend(live_streams)
        logger.info(f"✅ Added {len(live_categories)} live categories and {len(live_streams)} live streams")

        # Process VOD content if requested and available. Anything that is
        # not a non-empty list (missing, failed, wrong shape) is skipped.
        if include_vod:
            logger.info("Processing VOD content...")

            vod_categories = results.get("vod_categories")
            if isinstance(vod_categories, list) and vod_categories:
                _tag_content_type(vod_categories, "vod")
                all_categories.extend(vod_categories)
                logger.info(f"✅ Added {len(vod_categories)} VOD categories")

            series_categories = results.get("series_categories")
            if isinstance(series_categories, list) and series_categories:
                _tag_content_type(series_categories, "series")
                all_categories.extend(series_categories)
                logger.info(f"✅ Added {len(series_categories)} series categories")

            # Only process massive stream lists if they were actually fetched
            vod_streams = results.get("vod_streams")
            if isinstance(vod_streams, list) and vod_streams:
                logger.info(f"🔥 Processing {len(vod_streams)} VOD streams (this is the slow part)...")
                _tag_content_type(vod_streams, "vod", progress_label="VOD streams")
                all_streams.extend(vod_streams)
                logger.info(f"✅ Added {len(vod_streams)} VOD streams")

            series = results.get("series")
            if isinstance(series, list) and series:
                logger.info(f"🔥 Processing {len(series)} series (this is also slow)...")
                _tag_content_type(series, "series", progress_label="series")
                all_streams.extend(series)
                logger.info(f"✅ Added {len(series)} series")

    except Exception as e:
        logger.error(f"Critical error fetching API data: {e}")
        return (
            None,
            None,
            json.dumps(
                {
                    "error": "API Fetch Error",
                    "details": f"Failed to fetch data from IPTV service: {str(e)}",
                }
            ),
            500,
        )

    logger.info(f"🚀 CONCURRENT FETCH COMPLETE: {len(all_categories)} total categories and {len(all_streams)} total streams")
    return all_categories, all_streams, None, None
@app.route("/categories", methods=["GET"])
def get_categories():
    """Return the Xtream provider's categories as a JSON array.

    VOD and series categories are only included when the request carries
    ``include_vod=true``.
    """
    json_headers = {"Content-Type": "application/json"}

    # Required query parameters (the proxy URL is not needed here)
    url, username, password, _proxy_url, error = get_required_params()
    if error:
        return error

    # VOD is opt-in: it is large and slow to fetch
    vod_flag = request.args.get("include_vod", "false")
    include_vod = vod_flag.lower() == "true"
    logger.info(f"VOD content requested: {include_vod}")

    # Reject bad credentials before fetching anything else
    _user_data, auth_error, auth_status = validate_xtream_credentials(url, username, password)
    if auth_error:
        return auth_error, auth_status, json_headers

    categories, _channels, fetch_error, fetch_status = fetch_categories_and_channels(
        url, username, password, include_vod
    )
    if fetch_error:
        return fetch_error, fetch_status, json_headers

    return json.dumps(categories), 200, json_headers
@app.route("/xmltv", methods=["GET"])
def generate_xmltv():
    """Return the provider's XMLTV guide with icon URLs routed through the image proxy.

    No group filtering is applied on this endpoint.

    Returns:
        The XMLTV document as an ``application/xml`` attachment named
        ``guide.xml``, or a JSON error response when parameters, credentials
        or the upstream fetch fail.
    """
    import html  # local import: only needed for unescaping icon URLs

    json_headers = {"Content-Type": "application/json"}
    xml_headers = {"Content-Disposition": "attachment; filename=guide.xml"}

    # Get and validate parameters
    url, username, password, proxy_url, error = get_required_params()
    if error:
        return error

    # Validate credentials
    user_data, error_json, error_code = validate_xtream_credentials(url, username, password)
    if error_json:
        return error_json, error_code, json_headers

    # Fetch XMLTV data; credentials are encoded so characters such as "&" or
    # "#" cannot corrupt the query string.
    base_url = url.rstrip("/")
    credentials = urllib.parse.urlencode({"username": username, "password": password})
    xmltv_url = f"{base_url}/xmltv.php?{credentials}"
    xmltv_data = fetch_api_data(xmltv_url, timeout=20)  # Longer timeout for XMLTV

    if isinstance(xmltv_data, tuple):  # Error response
        return json.dumps(xmltv_data[0]), xmltv_data[1], json_headers

    # fetch_api_data returns a parsed JSON value when the body is valid JSON.
    # That is never an XMLTV document and cannot be rewritten as text.
    if not isinstance(xmltv_data, str):
        return (
            json.dumps(
                {
                    "error": "Invalid Response",
                    "details": "XMLTV endpoint did not return an XML document",
                }
            ),
            502,
            json_headers,
        )

    # If not proxying, return the original XMLTV
    if not proxy_url:
        return Response(xmltv_data, mimetype="application/xml", headers=xml_headers)

    # Replace image URLs in the XMLTV content with proxy URLs
    def replace_icon_url(match):
        # The attribute value is XML-escaped (e.g. "&amp;" for "&"); recover
        # the real URL before percent-encoding it for the proxy path.
        original_url = html.unescape(match.group(1))
        proxied_url = f"{proxy_url}/image-proxy/{encode_url(original_url)}"
        return f'<icon src="{proxied_url}"'

    xmltv_data = re.sub(r'<icon src="([^"]+)"', replace_icon_url, xmltv_data)

    # Return the XMLTV data
    return Response(xmltv_data, mimetype="application/xml", headers=xml_headers)
@app.route("/m3u", methods=["GET"])
def generate_m3u():
    """Generate a filtered M3U playlist from the Xtream API.

    Query parameters, besides the required ``url``/``username``/``password``:
        wanted_groups: Comma-separated group patterns to keep. When given,
            ``unwanted_groups`` is ignored.
        unwanted_groups: Comma-separated group patterns to drop.
        nostreamproxy: ``true`` to emit direct stream and logo URLs instead of
            proxied ones.
        include_vod: ``true`` to add VOD and series entries.

    Returns:
        The playlist as an attachment (``FullPlaylist.m3u`` with VOD,
        ``LiveStream.m3u`` otherwise), or a JSON error response.
    """
    json_headers = {"Content-Type": "application/json"}

    # Get and validate parameters
    url, username, password, proxy_url, error = get_required_params()
    if error:
        return error

    # Parse filter parameters
    unwanted_groups = parse_group_list(request.args.get("unwanted_groups", ""))
    wanted_groups = parse_group_list(request.args.get("wanted_groups", ""))
    no_stream_proxy = request.args.get("nostreamproxy", "").lower() == "true"
    include_vod = request.args.get("include_vod", "false").lower() == "true"  # Default to false to avoid timeouts

    # For M3U generation, warn about VOD performance impact
    if include_vod:
        logger.warning("⚠️ M3U generation with VOD enabled - expect 2-5 minute generation time!")
    else:
        logger.info("⚡ M3U generation for live content only - should be fast!")

    # Log filter parameters
    logger.info(
        f"Filter parameters - wanted_groups: {wanted_groups}, unwanted_groups: {unwanted_groups}, include_vod: {include_vod}"
    )

    # Validate credentials
    user_data, error_json, error_code = validate_xtream_credentials(url, username, password)
    if error_json:
        return error_json, error_code, json_headers

    # Fetch categories and channels
    categories, streams, error_json, error_code = fetch_categories_and_channels(url, username, password, include_vod)
    if error_json:
        return error_json, error_code, json_headers

    # Use the credentials and server address reported by the provider itself
    username = user_data["user_info"]["username"]
    password = user_data["user_info"]["password"]
    server_url = f"http://{user_data['server_info']['url']}:{user_data['server_info']['port']}"

    # Create category name lookup
    category_names = {cat["category_id"]: cat["category_name"] for cat in categories}

    # Log all available groups
    all_groups = set(category_names.values())
    logger.info(f"All available groups: {sorted(all_groups)}")

    # Collect playlist lines and join once at the end instead of growing one
    # string with "+=" for every stream.
    playlist_lines = ["#EXTM3U"]
    included_groups = set()

    for stream in streams:
        content_type = stream.get("content_type", "live")
        category_name = category_names.get(stream.get("category_id"), "Uncategorized")

        # Determine group title and display name based on content type
        if content_type == "series":
            group_title = f"Series - {category_name}"
            stream_name = stream.get("name", "Unknown Series")
        else:
            group_title = f"VOD - {category_name}" if content_type == "vod" else category_name
            stream_name = stream.get("name", "Unknown")

        # wanted_groups takes precedence; unwanted_groups only applies when no
        # wanted list was given.
        if wanted_groups:
            include_stream = any(group_matches(group_title, wanted_group) for wanted_group in wanted_groups)
        elif unwanted_groups:
            include_stream = not any(group_matches(group_title, unwanted_group) for unwanted_group in unwanted_groups)
        else:
            include_stream = True

        if not include_stream:
            continue

        included_groups.add(group_title)

        # Handle logo URL - proxy only if stream proxying is enabled
        original_logo = stream.get("stream_icon", "")
        if original_logo and not no_stream_proxy:
            logo_url = f"{proxy_url}/image-proxy/{encode_url(original_logo)}"
        else:
            logo_url = original_logo

        # Create the stream URL based on content type
        if content_type in ("live", "vod"):
            stream_id = stream.get("stream_id")
            if stream_id is None:
                # One malformed entry must not abort the whole playlist.
                logger.warning(f"Skipping {content_type} entry without stream_id: {stream_name}")
                continue
            if content_type == "live":
                stream_url = f"{server_url}/live/{username}/{password}/{stream_id}.ts"
            else:
                extension = stream.get("container_extension", "mp4")
                stream_url = f"{server_url}/movie/{username}/{password}/{stream_id}.{extension}"
        elif content_type == "series":
            episodes = stream.get("episodes")
            if episodes:
                # Use the first episode of the first season, if there is one
                first_season = next(iter(episodes.values()), None)
                first_episode = first_season[0] if first_season else None
                if not first_episode:
                    continue  # Skip series without episodes
                episode_id = first_episode.get("id", stream.get("series_id", ""))
                extension = first_episode.get("container_extension", "mp4")
                stream_url = f"{server_url}/series/{username}/{password}/{episode_id}.{extension}"
            else:
                # Fallback for series without episode data
                series_id = stream.get("series_id", stream.get("stream_id", ""))
                stream_url = f"{server_url}/series/{username}/{password}/{series_id}.mp4"
        else:
            # Unknown content type: there is no URL scheme to build for it.
            continue

        # Apply stream proxying if enabled
        if not no_stream_proxy:
            stream_url = f"{proxy_url}/stream-proxy/{encode_url(stream_url)}"

        # Add stream to playlist
        playlist_lines.append(
            f'#EXTINF:0 tvg-name="{stream_name}" group-title="{group_title}" tvg-logo="{logo_url}",{stream_name}'
        )
        playlist_lines.append(stream_url)

    m3u_playlist = "\n".join(playlist_lines) + "\n"

    # Log included groups after filtering
    logger.info(f"Groups included after filtering: {sorted(included_groups)}")
    logger.info(f"Groups excluded after filtering: {sorted(all_groups - included_groups)}")

    # Determine filename based on content included
    filename = "FullPlaylist.m3u" if include_vod else "LiveStream.m3u"

    # "audio/x-mpegurl" is the conventional M3U media type; "audio/x-scpls"
    # denotes the unrelated PLS playlist format.
    return Response(
        m3u_playlist,
        mimetype="audio/x-mpegurl",
        headers={"Content-Disposition": f"attachment; filename={filename}"},
    )
if __name__ == "__main__":
    # The server binds to every interface, and the Werkzeug debugger lets
    # anyone who can reach it execute arbitrary code. Debug mode is therefore
    # opt-in via FLASK_DEBUG instead of always on.
    debug_enabled = os.environ.get("FLASK_DEBUG", "").strip().lower() in ("1", "true", "yes", "on")
    app.run(debug=debug_enabled, host="0.0.0.0")