Update app.py

2025-03-25 13:59:18 +08:00 · 2025-03-25 13:59:18 +08:00 · 010ceea80e
commit 010ceea80e
parent f7ee6cba5b
1 changed files with 131 additions and 247 deletions
--- a/app.py
+++ b/app.py
@ -1,282 +1,166 @@
 import re
 import requests
 import os
+from collections import defaultdict

-# ========== 配置区域 ==========
+# ================== Configuration ==================
+# Groups to drop: a channel whose group-title is one of these is filtered out
+DELETE_GROUPS = ["4K频道", "8K频道"]

-# 定义需要删除的 group-title 属性值
-# 这些分组下的频道将不会出现在最终的 m3u 文件中
-delete_groups = ["4K频道", "8K频道"]
-
-# 定义需要替换为 "地方频道" 的省份
-# 当频道的 group-title 为这些省份时，会根据频道名称是否包含 "卫视" 进行不同处理
-# 若不包含 "卫视"，则将 group-title 替换为 "地方频道"；若包含 "卫视"，则替换为 "卫视频道"
-province_groups = ["北京", "安徽", "甘肃", "广东", "贵州", "海南", "河北", "河南", "黑龙江", "湖北", "湖南",
+# Province group names: a channel in one of these groups is moved to "地方频道",
+# or to "卫视频道" when its #EXTINF line contains "卫视"
+PROVINCE_GROUPS = ["北京", "安徽", "甘肃", "广东", "贵州", "海南", "河北", "河南", "黑龙江", "湖北", "湖南",
                   "吉林", "江苏", "江西", "辽宁", "青海", "山东", "上海", "四川", "云南", "浙江", "重庆", "香港"]

-# 定义需要替换的 group-title 属性值
-# 这里指定了一些旧的 group-title 名称和对应的新名称，程序会将旧名称替换为新名称
-replace_groups = {
+# group-title rename rules (old group name -> new group name)
+GROUP_REPLACEMENTS = {
    "央视": "央视频道",
    "卫视": "卫视频道",
    "其他": "其他频道"
 }

-# 定义需要删除的频道名称中的字符
-# 这些字符会从频道名称中被移除，以达到清洗频道名称的目的
-delete_chars = ["iHOT-", "NewTV-", "SiTV-", "-HEVC", "-50-FPS", "-高码", "-4K", "-BPTV", "咪咕视频_8M1080_"]
+# Redundant substrings removed from each channel's #EXTINF line
+DELETE_CHARS = ["iHOT-", "NewTV-", "SiTV-", "-HEVC", "-50-FPS", "-高码", "-4K", "-BPTV", "咪咕视频_8M1080_"]

-# 定义最终 group 排序顺序
-# 最终生成的 m3u 文件中，频道分组会按照这个顺序进行排列
-# 未在这个列表中的分组会排在最后，并按分组名称排序
-sort_order = ["收藏频道", "央视频道", "卫视频道", "其他频道", "地方频道"]
+# Output order of groups; groups not listed here come afterwards, sorted by name
+GROUP_ORDER = ["收藏频道", "央视频道", "卫视频道", "其他频道", "地方频道"]

-# 需要下载的 m3u 链接及对应 UA 和名称
-# 每个字典代表一个 m3u 文件的下载信息
-# "name" 是该 m3u 文件的名称，用于日志输出
-# "url" 是 m3u 文件的下载地址
-# "ua" 是请求时使用的 User-Agent
-m3u_list = [
-    {"name": "aktv", "url": "https://gh.tryxd.cn/https://raw.githubusercontent.com/alantang1977/JunTV/refs/heads/main/output/result.m3u", "ua": "okhttp/4.12.0"},
+# Data sources: each entry gives a display name ("name"), the playlist URL
+# ("url") and the User-Agent ("ua") sent when downloading it
+M3U_SOURCES = [
+    {"name": "aktv", "url": "https://gh.tryxd.cn/https://raw.githubusercontent.com/alantang1977/JunTV/main/output/result.m3u", "ua": "okhttp/4.12.0"},
    {"name": "自用收藏", "url": "http://aktv.space/live.m3u", "ua": "okhttp/4.12.0"},
    {"name": "big", "url": "https://gh.tryxd.cn/https://raw.githubusercontent.com/big-mouth-cn/tv/main/iptv-ok.m3u", "ua": "okhttp/4.12.0"},
    {"name": "xhztv", "url": "http://xhztv.top/new.txt", "ua": "okhttp/4.12.0"},
    {"name": "top", "url": "http://tot.totalh.net/tttt.txt", "ua": "okhttp/4.12.0"},
    {"name": "zbds", "url": "https://live.zbds.top/tv/iptv6.txt", "ua": "okhttp/4.12.0"},
-    {"name": "野火", "url": "https://gh.tryxd.cn/https://raw.githubusercontent.com/tianya7981/jiekou/refs/heads/main/野火959", "ua": "okhttp/4.12.0"},
+    {"name": "野火", "url": "https://gh.tryxd.cn/https://raw.githubusercontent.com/tianya7981/jiekou/main/野火959", "ua": "okhttp/4.12.0"},
    {"name": "jundie", "url": "http://home.jundie.top:81/Cat/tv/live.txt", "ua": "okhttp/4.12.0"},
-    {"name": "MyIPTV", "url": "https://gh.tryxd.cn/https://raw.githubusercontent.com/SPX372928/MyIPTV/master/黑龙江PLTV移动CDN版.txt", "ua": "okhttp/4.12.0"},
-    {"name": "mylist", "url": "https://gh.tryxd.cn/https://raw.githubusercontent.com/yuanzl77/IPTV/main/live.m3u", "ua": "okhttp/4.12.0"},  
-    {"name": "Kimentanm", "url": "https://gh.tryxd.cn/https://raw.githubusercontent.com/Kimentanm/aptv/master/m3u/iptv.m3u", "ua": "okhttp/4.12.0"},
-    {"name": "Chinese", "url": "https://gh.tryxd.cn/https://raw.githubusercontent.com/BurningC4/Chinese-IPTV/master/TV-IPV4.m3u", "ua": "okhttp/4.12.0"},
-    {"name": "kimwang1978", "url": "https://gh.tryxd.cn/https://raw.githubusercontent.com/kimwang1978/collect-tv-txt/main/merged_output_simple.txt", "ua": "okhttp/4.12.0"},
-    {"name": "电视", "url": "https://codeberg.org/sy147258/iptv/raw/branch/main/电视", "ua": "okhttp/4.12.0"},
-    {"name": "Gather", "url": "https://gh.tryxd.cn/https://raw.githubusercontent.com/Guovin/iptv-api/gd/output/result.txt", "ua": "okhttp/4.12.0"},
-    # 可以继续增加
+    {"name": "MyIPTV", "url": "https://gh.tryxd.cn/https://raw.githubusercontent.com/SPX372928/MyIPTV/master/黑龙江PLTV移动CDN版.txt", "ua": "okhttp/4.12.0"}
 ]

-# ========== 功能函数 ==========
-
-def download_m3u(url, ua):
-    """下载 m3u 文件，支持自定义 User-Agent"""
+# ================== 核心功能 ==================
+def robust_download(url, ua, max_retries=3):
+    """Download a URL as text, retrying when an attempt fails.
+
+    Each attempt is a GET with a 15-second timeout. A failed attempt is
+    retried immediately; there is no delay between attempts.
+
+    Args:
+        url: Address to fetch.
+        ua: Value sent as the User-Agent header.
+        max_retries: Maximum number of attempts.
+
+    Returns:
+        The response body as text, decoded with the encoding that requests
+        detects from the body. Implicitly returns None when max_retries is
+        less than 1, because the loop never runs.
+
+    Raises:
+        Exception: whatever the final attempt raised (from requests.get or
+            raise_for_status) once every attempt has failed.
+    """
    headers = {'User-Agent': ua}
-    response = requests.get(url, headers=headers)
-    response.raise_for_status()
-    response.encoding = 'utf-8'
-    return response.text
-
-def remove_extm3u_lines(lines):
-    """删除带有 #EXTM3U 的行"""
-    return [line for line in lines if not line.startswith("#EXTM3U")]
-
-def process_m3u(content):
-    """预处理 m3u 内容：清洗、替换、标准化"""
-    # 先删除 #EXTM3U 行
-    lines = remove_extm3u_lines(content.splitlines())
-    processed = []
-    i = 0
-    while i < len(lines):
-        line = lines[i]
-        if line.startswith("#EXTINF"):
-            url_line = lines[i + 1]
-            # 删除不需要的 group
-            if any(group in line for group in delete_groups):
-                i += 2
-                continue
-            # 替换 group-title
-            for old, new in replace_groups.items():
-                line = line.replace(f'group-title="{old}"', f'group-title="{new}"')
-            # 省份处理
-            for province in province_groups:
-                if f'group-title="{province}"' in line:
-                    line = line.replace(f'group-title="{province}"', 'group-title="地方频道"') if "卫视" not in line else line.replace(f'group-title="{province}"', 'group-title="卫视频道"')
-            # 特殊频道修正
-            if "凤凰卫视" in line:
-                line = line.replace('group-title="地方频道"', 'group-title="卫视频道"')
-            if "SiTV-" in line:
-                line = line.replace('group-title="地方频道"', 'group-title="SiTV"')
-            # 删除无用字符
-            for char in delete_chars:
-                line = line.replace(char, "")
-            # CCTV 标准化
-            line = re.sub(r'cctv-?', 'CCTV', line, flags=re.IGNORECASE)
-            # 替换 i.880824.xyz 为 192.168.31.2
-            url_line = url_line.replace("i.880824.xyz", "192.168.31.2")
-            # 添加处理后频道
-            processed.append(line)
-            processed.append(url_line)
-            i += 2
-        else:
-            processed.append(line)
-            i += 1
-    return processed
-
-def merge_m3u(all_m3u_lists):
-    """合并所有 m3u 列表，并删除空行"""
-    merged = []
-    for m3u_list in all_m3u_lists:
-        merged.extend(m3u_list)
-    # 删除空行
-    merged = [line for line in merged if line.strip()]
-    return merged
-
-def sort_m3u(lines):
-    """按 group-title 排序，未包含的组排最后"""
-    sorted_result = []
-    remaining_lines = lines[:]
-    remaining_groups = {}
-
-    for group in sort_order:
-        i = 0
-        while i < len(remaining_lines):
-            if remaining_lines[i].startswith("#EXTINF") and f'group-title="{group}"' in remaining_lines[i]:
-                sorted_result.append(remaining_lines[i])
-                sorted_result.append(remaining_lines[i + 1])
-                del remaining_lines[i:i + 2]
-            else:
-                i += 1
-
-    # 处理未在 sort_order 中的分组
-    i = 0
-    while i < len(remaining_lines):
-        if remaining_lines[i].startswith("#EXTINF"):
-            group_match = re.search(r'group-title="([^"]+)"', remaining_lines[i])
-            if group_match:
-                group = group_match.group(1)
-                if group not in remaining_groups:
-                    remaining_groups[group] = []
-                remaining_groups[group].extend([remaining_lines[i], remaining_lines[i + 1]])
-            i += 2
-        else:
-            i += 1
-
-    # 按分组名称排序未在 sort_order 中的分组
-    for group in sorted(remaining_groups.keys()):
-        sorted_result.extend(remaining_groups[group])
-
-    return sorted_result
-
-def sort_channels_in_groups(lines):
-    """将每个分组中相同的频道名称放在一起，分组内按默认顺序排序"""
-    grouped_channels = {}
-    i = 0
-    while i < len(lines):
-        if lines[i].startswith("#EXTINF"):
-            group_match = re.search(r'group-title="([^"]+)"', lines[i])
-            if group_match:
-                group = group_match.group(1)
-                channel_name = re.search(r',([^,]+)$', lines[i]).group(1)
-                if group not in grouped_channels:
-                    grouped_channels[group] = {}
-                if channel_name not in grouped_channels[group]:
-                    grouped_channels[group][channel_name] = []
-                grouped_channels[group][channel_name].extend([lines[i], lines[i + 1]])
-            i += 2
-        else:
-            i += 1
-
-    sorted_lines = []
-    for group in sort_order:
-        if group in grouped_channels:
-            for channel_name in grouped_channels[group]:
-                sorted_lines.extend(grouped_channels[group][channel_name])
-
-    # 处理未在 sort_order 中的分组
-    remaining_groups = [group for group in grouped_channels if group not in sort_order]
-    for group in sorted(remaining_groups):
-        for channel_name in grouped_channels[group]:
-            sorted_lines.extend(grouped_channels[group][channel_name])
-
-    return sorted_lines
-
-def save_m3u(lines, filename):
-    """保存 m3u 文件"""
-    with open(filename, 'w', encoding='utf-8') as f:
-        f.write("\n".join(lines))
-
-# ========== 主流程 ==========
-def save_txt(lines, filename):
-    """保存为 live.txt 格式（格式：分组名称,频道名称,URL）"""
-    try:
-        with open(filename, 'w', encoding='utf-8') as f:
-            i = 0
-            channel_count = 0  # 频道计数器
-            while i < len(lines):
-                # 严格匹配 #EXTINF 行
-                if lines[i].startswith("#EXTINF"):
-                    # 提取分组名称
-                    group_match = re.search(r'group-title="([^"]+)"', lines[i])
-                    group = group_match.group(1) if group_match else "未知分组"
-                    
-                    # 提取频道名称（兼容含逗号的复杂名称）
-                    channel_name = re.split(r',(?![^"]*\"\,)', lines[i])[-1].strip()
-                    
-                    # 获取URL并校验索引
-                    if i+1 < len(lines) and not lines[i+1].startswith("#"):
-                        url = lines[i+1].strip()
-                        f.write(f"{group},{channel_name},{url}\n")
-                        channel_count += 1
-                    else:
-                        print(f"⚠️ 第 {i+1} 行URL格式错误，已跳过")
-                    i += 2
-                else:
-                    # 跳过非频道行（如#EXTVLCOPT）
-                    i += 1
-            print(f"✅ 成功写入 {channel_count} 个频道到 {filename}")
-    except PermissionError:
-        print(f"❌ 致命错误：无权限写入文件 {filename}")
-        exit(1)
-    except Exception as e:
-        print(f"❌ 文件保存失败：{str(e)}")
-        exit(1)
-      
-def main():
-    all_processed_m3u = []
-
-    # 下载并处理所有 m3u 文件
-    for idx, item in enumerate(m3u_list, start=1):
-        name = item["name"]
-        url = item["url"]
-        ua = item["ua"]
-        print(f"正在处理: {name} ({url}) (UA: {ua})")
-
+    for attempt in range(max_retries):
        try:
-            raw_content = download_m3u(url, ua)
-            processed = process_m3u(raw_content)
-            all_processed_m3u.append(processed)
-            print(f"成功处理第 {idx} 个 m3u，频道数：{len(processed)//2}")
+            response = requests.get(url, headers=headers, timeout=15)
+            response.raise_for_status()
+            response.encoding = response.apparent_encoding  # decode with the encoding detected from the body
+            return response.text
        except Exception as e:
-            print(f"⚠️ 下载或处理失败：{url}, 错误：{e}")
+            # Final attempt failed: propagate the error to the caller
+            if attempt == max_retries - 1:
+                raise
+            print(f"正在重试 {url} (第 {attempt+1} 次)")

-    # 合并所有列表
-    merged_m3u = merge_m3u(all_processed_m3u)
-    print(f"共合并频道数：{len(merged_m3u)//2}")
+def process_channel(line):
+    """Normalize one #EXTINF line, or drop it.
+
+    Steps, in order: filter DELETE_GROUPS, apply GROUP_REPLACEMENTS, map
+    PROVINCE_GROUPS to "地方频道" / "卫视频道", move "凤凰卫视" to "卫视频道",
+    remove DELETE_CHARS substrings, and rewrite "cctv" / "cctv-" (any case)
+    as "CCTV".
+
+    Args:
+        line: The channel's #EXTINF line.
+
+    Returns:
+        The rewritten line, or None when the channel's group-title is listed
+        in DELETE_GROUPS.
+    """
+    # Drop channels that belong to a deleted group
+    if any(f'group-title="{g}"' in line for g in DELETE_GROUPS):
+        return None

-    # 全局排序
-    sorted_m3u = sort_m3u(merged_m3u)
+    # Rename groups according to GROUP_REPLACEMENTS
+    for old, new in GROUP_REPLACEMENTS.items():
+        line = line.replace(f'group-title="{old}"', f'group-title="{new}"')

-    # 对每个分组内的频道进行排序
-    sorted_channels = sort_channels_in_groups(sorted_m3u)
+    # Province groups: satellite channels ("卫视" anywhere in the line) go to
+    # "卫视频道", everything else to "地方频道"
+    for province in PROVINCE_GROUPS:
+        if f'group-title="{province}"' in line:
+            new_group = '地方频道' if "卫视" not in line else '卫视频道'
+            line = line.replace(f'group-title="{province}"', f'group-title="{new_group}"')

-    # 保存最终文件
-    output_file = "live.m3u"
-    save_m3u(sorted_channels, output_file)
-    print(f"✅ 最终合并排序文件已保存为 {output_file}")
+    # Special case: "凤凰卫视" channels filed under "地方频道" move to "卫视频道"
+    if "凤凰卫视" in line:
+        line = line.replace('group-title="地方频道"', 'group-title="卫视频道"')

-    # 新增：在保存前验证数据有效性
-    if len(sorted_channels) == 0:
-        print("❌ 错误：sorted_channels 为空，无法生成文件")
-        exit(1)
-    else:
-        print(f"调试信息：首个频道数据 -> {sorted_channels[0]}")
+    # Strip redundant substrings.
+    # NOTE(review): this and the CCTV rewrite below run on the whole line, so
+    # they also change matches inside other attribute values - confirm intended
+    for char in DELETE_CHARS:
+        line = line.replace(char, "")
+    
+    # Normalize the spelling of CCTV (case-insensitive, optional trailing "-")
+    line = re.sub(r'cctv-?', 'CCTV', line, flags=re.IGNORECASE)
+    
+    return line

-    # 保存最终文件
-    output_file = "live.m3u"
-    save_m3u(sorted_channels, output_file)
-    print(f"✅ M3U文件已保存为 {output_file}")
+def parse_m3u(content):
+    """Parse M3U text into a list of channel records.
+
+    Each ``#EXTINF`` line is paired with the first following line that starts
+    with ``http``. Every other line (``#EXTM3U``, blank lines, other
+    directives, non-http text) is ignored.
+
+    Args:
+        content: Raw playlist text.
+
+    Returns:
+        A list of ``{"meta": <#EXTINF line>, "url": <url line>}`` dicts in
+        file order. Every record carries both keys.
+    """
+    channels = []
+    pending_meta = None  # most recent #EXTINF line still waiting for its URL
+
+    for line in content.splitlines():
+        line = line.strip()
+        if line.startswith("#EXTINF"):
+            pending_meta = line
+        elif line.startswith("http"):
+            # A URL with no pending #EXTINF (a bare URL list, or a second URL
+            # after one #EXTINF) has no metadata. Skip it rather than emit a
+            # record without "meta", which callers index unconditionally.
+            if pending_meta is not None:
+                channels.append({"meta": pending_meta, "url": line})
+                pending_meta = None
+    return channels

-    # 保存为TXT格式（增强版）
-    save_txt(sorted_channels, "live.txt") 
+def generate_output(channels):
+    """Render channels as M3U text, grouped by group-title.
+
+    Groups named in GROUP_ORDER come first, in that order; every other group
+    follows, sorted by name. Within a group the input order is kept. Channels
+    whose "meta" has no group-title attribute are left out.
+
+    Args:
+        channels: Iterable of dicts with "meta" (#EXTINF line) and "url".
+
+    Returns:
+        The playlist text: an "#EXTM3U" header followed by meta/url line
+        pairs, joined with newlines.
+    """
+    by_group = defaultdict(list)
+    for entry in channels:
+        found = re.search(r'group-title="([^"]+)"', entry["meta"])
+        if found is None:
+            continue
+        by_group[found.group(1)].append(entry)
+
+    # Configured groups first (each at most once), then the rest by name
+    preferred = [name for name in dict.fromkeys(GROUP_ORDER) if name in by_group]
+    leftovers = sorted(name for name in by_group if name not in GROUP_ORDER)
+
+    lines = ["#EXTM3U"]
+    for name in preferred + leftovers:
+        for entry in by_group[name]:
+            lines.extend((entry["meta"], entry["url"]))
+    return "\n".join(lines)
+
+def main():
+    """Download every source, merge the channels and write the playlists.
+
+    Each entry of M3U_SOURCES is downloaded, parsed and passed through
+    process_channel; a source that fails is reported and skipped. The merged
+    result is written, with identical content, to "live.txt" and "live.m3u"
+    in the current working directory. A failed write is reported and does not
+    stop the other file from being written.
+    """
+    all_channels = []
+
+    print("开始下载和处理数据源...")
+    for source in M3U_SOURCES:
+        # Best-effort boundary: one broken source must not abort the whole run
+        try:
+            content = robust_download(source["url"], source["ua"])
+            channels = parse_m3u(content)
+
+            processed = []
+            for ch in channels:
+                # process_channel returns None for channels in deleted groups
+                if cleaned_meta := process_channel(ch["meta"]):
+                    processed.append({"meta": cleaned_meta, "url": ch["url"]})
+
+            all_channels.extend(processed)
+            print(f"[✓] 成功处理 {source['name']} ({len(processed)} 个频道)")
+        except Exception as e:
+            print(f"[×] 处理 {source['name']} 失败: {str(e)}")
+
+    print("生成最终文件...")
+    final_content = generate_output(all_channels)
+
+    # NOTE(review): live.txt receives the same M3U text as live.m3u - confirm
+    # that this is the format consumers of live.txt expect
+    for filename in ("live.txt", "live.m3u"):
+        try:
+            with open(filename, "w", encoding="utf-8") as f:
+                f.write(final_content)
+        except (OSError, UnicodeError) as e:
+            print(f"生成 {filename} 失败: {str(e)}")
+        else:
+            print(f"生成 {filename} 成功！")
+
+    # The files are UTF-8 encoded, so report encoded bytes rather than the
+    # character count (they differ for non-ASCII channel names)
+    size_kb = len(final_content.encode("utf-8")) // 1024
+    print(f"共处理 {len(all_channels)} 个频道，文件大小: {size_kb}KB")

 if __name__ == "__main__":
    main()