Merge pull request #498 from Guovin/dev
Dev
Guovin authored Nov 1, 2024
2 parents fdd75dd + cc56542 commit 3f3ca2d
Showing 6 changed files with 97 additions and 39 deletions.
2 changes: 1 addition & 1 deletion docs/tutorial.md
@@ -58,7 +58,7 @@

1. Create the file
2. Name the template file user_demo.txt
3. The template file must be written in the format (channel category, #genre#), (channel name, channel interface); note that the commas are English commas.
3. The template file must be written in the format (channel category, #genre#), (channel name, channel interface); note that the commas are English commas. If you need to whitelist an interface (no speed testing, kept at the front of the results), simply add $! after its address, e.g. http://xxx$!. Additional remarks can be appended after it, e.g.: http://xxx$!whitelist interface
4. Click Commit changes... to save

![Create user_demo.txt](./images/edit-user-demo.png 'Create user_demo.txt')
2 changes: 1 addition & 1 deletion docs/tutorial_en.md
Expand Up @@ -55,7 +55,7 @@ When you click to confirm and create in step one, you will be automatically redi

1. Create file
2. Name the template file user_demo.txt
3. The template file needs to be written in the format of (channel category, #genre#), (channel name, channel interface); note that the commas must be English commas.
3. The template file needs to be written in the format of (channel category, #genre#), (channel name, channel interface); note that the commas must be English commas. If you need to whitelist an interface (no speed testing, kept at the front of the results), simply add $! after the address, for example: http://xxx$!. Additional information can also be appended afterward, for example: http://xxx$!whitelist interface.
4. Click Commit changes... to save

![Create user_demo.txt](./images/edit-user-demo.png 'Create user_demo.txt')
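As a quick illustration of the template syntax described above, here is a minimal Python sketch that splits one template line into name, URL, whitelist flag, and remark. The channel name and URL are placeholders, not entries shipped with the project:

```python
# Minimal sketch: splitting a template entry that uses the "$!" whitelist marker.
# The channel name and URL below are placeholders.
line = "CCTV-1,http://example.com/live.m3u8$!whitelist interface"

name, _, address = line.partition(",")       # channel name, rest of the line
url, _, info = address.partition("$")        # URL before "$", extra info after it
is_whitelist = info.startswith("!")          # "!" right after "$" marks a whitelist entry
remark = info[1:] if is_whitelist else info  # optional note after "$!"

print(name, url, is_whitelist, remark)
# CCTV-1 http://example.com/live.m3u8 True whitelist interface
```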
2 changes: 1 addition & 1 deletion main.py
@@ -130,7 +130,7 @@ def pbar_update(self, name=""):
def get_urls_len(self, filter=False):
data = copy.deepcopy(self.channel_data)
if filter:
process_nested_dict(data, seen=set(), flag=r"cache:(.*)")
process_nested_dict(data, seen=set(), flag=r"cache:(.*)", force_str="!")
processed_urls = set(
url_info[0]
for channel_obj in data.values()
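The new force_str="!" argument appears to exclude whitelist entries (URLs whose $ suffix starts with !) from the count of URLs that get_urls_len reports for the progress bar, since those entries skip speed testing. A rough, self-contained sketch of that counting idea, with made-up data:

```python
# Rough illustration of counting testable URLs while skipping "$!" whitelist
# entries, mirroring the intent of get_urls_len(filter=True). Data is made up.
channel_data = {
    "央视": {
        "CCTV-1": [
            ("http://example.com/a.m3u8", None, None, None),
            ("http://example.com/b.m3u8$!keep", None, None, "important"),  # whitelisted
        ]
    }
}

testable = {
    url_info[0]
    for channel_obj in channel_data.values()
    for info_list in channel_obj.values()
    for url_info in info_list
    if not url_info[0].partition("$")[2].startswith("!")
}
print(len(testable))  # 1 -> only the non-whitelisted URL is counted
```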
94 changes: 70 additions & 24 deletions utils/channel.py
@@ -92,9 +92,13 @@ def get_channel_data_from_file(channels, file, use_old):
if name not in category_dict:
category_dict[name] = []
if use_old and url:
info = (url, None, None, None)
if info[0] and info not in category_dict[name]:
category_dict[name].append(info)
info = url.partition("$")[2]
origin = None
if info and info.startswith("!"):
origin = "important"
data = (url, None, None, origin)
if data not in category_dict[name]:
category_dict[name].append(data)
return channels
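A compact sketch of the tagging step introduced above: when an old result URL carries a $! suffix, it is stored with origin "important" so later stages treat it as a whitelist entry. The URLs below are placeholders:

```python
# Sketch of tagging "$!" URLs as "important" when loading a local source file.
# The URLs are placeholders; the tuple layout (url, date, resolution, origin)
# follows the structure used in utils/channel.py.
def tag_origin(url):
    info = url.partition("$")[2]
    origin = "important" if info and info.startswith("!") else None
    return (url, None, None, origin)

print(tag_origin("http://example.com/a.m3u8"))        # (..., None)
print(tag_origin("http://example.com/b.m3u8$!note"))  # (..., 'important')
```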


@@ -119,10 +123,17 @@ def get_channel_items():
for cate, data in channels.items():
if cate in old_result:
for name, info_list in data.items():
urls = [
item[0].partition("$")[0]
for item in info_list
if item[0]
]
if name in old_result[cate]:
for info in old_result[cate][name]:
if info not in info_list:
channels[cate][name].append(info)
if info:
pure_url = info[0].partition("$")[0]
if pure_url not in urls:
channels[cate][name].append(info)
return channels
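The merge above now deduplicates on the "pure" URL (everything before $), so a history entry is skipped when the same interface already exists under a different suffix. A small self-contained sketch of that comparison, using made-up data:

```python
# Sketch: merging history entries only when their "pure" URL (before "$")
# is not already present. Sample data is made up.
info_list = [("http://example.com/a.m3u8$cache:abc", None, None, None)]
old_entries = [
    ("http://example.com/a.m3u8", "2024-10-01", "1080p", None),  # duplicate once "$..." is stripped
    ("http://example.com/b.m3u8", "2024-10-01", "720p", None),   # genuinely new
]

urls = [item[0].partition("$")[0] for item in info_list if item[0]]
for info in old_entries:
    if info and info[0].partition("$")[0] not in urls:
        info_list.append(info)

print([item[0] for item in info_list])
# ['http://example.com/a.m3u8$cache:abc', 'http://example.com/b.m3u8']
```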


@@ -473,17 +484,36 @@ def init_info_data(data, cate, name):
data[cate][name] = []


def append_data_to_info_data(info_data, cate, name, data, origin=None, check=True):
def append_data_to_info_data(
info_data, cate, name, data, origin=None, check=True, insert=False
):
"""
Append channel data to total info data
"""
init_info_data(info_data, cate, name)
urls = [x[0].partition("$")[0] for x in info_data[cate][name] if x[0]]
for item in data:
try:
url, date, resolution, *rest = item
origin = origin or (rest[0] if rest else None)
if (url and not check) or (url and check and check_url_by_patterns(url)):
info_data[cate][name].append((url, date, resolution, origin))
url_origin = origin or (rest[0] if rest else None)
if url:
pure_url = url.partition("$")[0]
if pure_url in urls:
continue
if (
url_origin == "important"
or (not check)
or (check and check_url_by_patterns(pure_url))
):
if insert:
info_data[cate][name].insert(
0, (url, date, resolution, url_origin)
)
else:
info_data[cate][name].append(
(url, date, resolution, url_origin)
)
urls.append(pure_url)
except:
continue
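For readability, here is a simplified, self-contained sketch of the updated append logic: deduplicate on the pure URL, let "important" (whitelist) entries bypass the pattern check, and optionally insert at the front of the list. check_url stands in for check_url_by_patterns, and the sample data is made up:

```python
# Simplified sketch of the updated append behaviour in append_data_to_info_data.
# check_url is a stand-in for check_url_by_patterns; data is made up.
def append_entries(bucket, entries, origin=None, check=True, insert=False,
                   check_url=lambda u: True):
    seen = [x[0].partition("$")[0] for x in bucket if x[0]]
    for url, date, resolution, *rest in entries:
        url_origin = origin or (rest[0] if rest else None)
        pure_url = url.partition("$")[0]
        if not url or pure_url in seen:
            continue  # skip duplicates of an already-known interface
        if url_origin == "important" or not check or check_url(pure_url):
            item = (url, date, resolution, url_origin)
            if insert:
                bucket.insert(0, item)  # whitelist entries go to the front
            else:
                bucket.append(item)
            seen.append(pure_url)

bucket = [("http://example.com/a.m3u8", None, None, "subscribe")]
append_entries(bucket, [("http://example.com/b.m3u8$!", None, None, "important")], insert=True)
print([x[0] for x in bucket])  # the whitelist entry ends up first
```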

@@ -499,19 +529,15 @@ def get_origin_method_name(method):

def append_old_data_to_info_data(info_data, cate, name, data):
"""
Append old channel data to total info data
Append history channel data to total info data
"""
append_data_to_info_data(
info_data,
cate,
name,
data,
)
print(name, "old:", len(data), end=", ")
print(
"total:",
len(info_data.get(cate, {}).get(name, [])),
)
print("History:", len(data), end=", ")


def append_total_data(
@@ -537,6 +563,8 @@ def append_total_data(
for cate, channel_obj in items:
for name, old_info_list in channel_obj.items():
print(f"{name}:", end=" ")
if constants.open_use_old_result and old_info_list:
append_old_data_to_info_data(data, cate, name, old_info_list)
for method, result in total_result:
if constants.open_method[method]:
origin_method = get_origin_method_name(method)
@@ -547,8 +575,10 @@
data, cate, name, name_results, origin=origin_method
)
print(f"{method.capitalize()}:", len(name_results), end=", ")
if constants.open_use_old_result:
append_old_data_to_info_data(data, cate, name, old_info_list)
print(
"total:",
len(data.get(cate, {}).get(name, [])),
)
if constants.open_keep_all:
extra_cate = "📥其它频道"
for method, result in total_result:
@@ -560,15 +590,20 @@
if name in names:
continue
print(f"{name}:", end=" ")
if constants.open_use_old_result:
old_info_list = channel_obj.get(name, [])
if old_info_list:
append_old_data_to_info_data(
data, extra_cate, name, old_info_list
)
append_data_to_info_data(
data, extra_cate, name, urls, origin=origin_method
)
print(name, f"{method.capitalize()}:", len(urls), end=", ")
if constants.open_use_old_result:
old_info_list = channel_obj.get(name, [])
append_old_data_to_info_data(
data, extra_cate, name, old_info_list
)
print(
"total:",
len(data.get(cate, {}).get(name, [])),
)
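With this reordering, history entries are merged into each channel before the per-method results, so later duplicates are dropped by the pure-URL check. A minimal ordering sketch with made-up data:

```python
# Minimal ordering sketch: history entries are added first, then per-method
# results; duplicates (same URL before "$") are dropped. Data is made up.
channel = []
seen = set()

def add(entries, label):
    for url in entries:
        pure = url.partition("$")[0]
        if pure in seen:
            continue
        seen.add(pure)
        channel.append((label, url))

add(["http://example.com/old.m3u8$!"], "history")  # history/whitelist first
add(["http://example.com/old.m3u8", "http://example.com/new.m3u8"], "subscribe")
print(channel)
# [('history', 'http://example.com/old.m3u8$!'), ('subscribe', 'http://example.com/new.m3u8')]
```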


async def sort_channel_list(
@@ -624,7 +659,7 @@ async def process_sort_channel_list(data, ipv6=False, callback=None):
is_ffmpeg = constants.open_ffmpeg and ffmpeg_installed
semaphore = asyncio.Semaphore(5)
need_sort_data = copy.deepcopy(data)
process_nested_dict(need_sort_data, seen=set(), flag=r"cache:(.*)")
process_nested_dict(need_sort_data, seen=set(), flag=r"cache:(.*)", force_str="!")
tasks = [
asyncio.create_task(
sort_channel_list(
@@ -658,7 +693,18 @@
}
for url, date, resolution, origin in info_list:
if "$" in url:
matcher = re.search(r"cache:(.*)", url)
info = url.partition("$")[2]
if info and info.startswith("!"):
append_data_to_info_data(
sort_data,
cate,
name,
[(url, date, resolution, origin)],
check=False,
insert=True,
)
continue
matcher = re.search(r"cache:(.*)", info)
if matcher:
cache_key = matcher.group(1)
if not cache_key:
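Putting the sorting branch above together: entries with a $! suffix appear to skip speed testing and are inserted at the front of the sorted results, entries with a cache: key reuse previous results, and everything else would be speed-tested. A rough routing sketch with placeholder URLs:

```python
# Rough sketch of how entries appear to be routed during sorting based on
# their "$" suffix. Sample URLs are placeholders.
import re

def classify(url):
    info = url.partition("$")[2]
    if info.startswith("!"):
        return "whitelist (no speed test, kept first)"
    matcher = re.search(r"cache:(.*)", info)
    if matcher and matcher.group(1):
        return f"reuse cached result for key {matcher.group(1)!r}"
    return "speed test"

for url in (
    "http://example.com/a.m3u8$!",
    "http://example.com/b.m3u8$cache:abc123",
    "http://example.com/c.m3u8",
):
    print(url, "->", classify(url))
```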
2 changes: 1 addition & 1 deletion utils/constants.py
@@ -192,7 +192,7 @@ def get_resolution_value(resolution_str):

log_path = os.path.join(log_dir, log_file)

url_pattern = r"\b((https?):\/\/)?(\[[0-9a-fA-F:]+\]|([\w-]+\.)+[\w-]+)(:[0-9]{1,5})?(\/[^\s]*)?\b"
url_pattern = r"((https?):\/\/)?(\[[0-9a-fA-F:]+\]|([\w-]+\.)+[\w-]+)(:[0-9]{1,5})?(\/[^\s]*)?(\$[^\s]+)?"

rtp_pattern = r"^([^,,]+)(?:[,,])?(rtp://.*)$"

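A quick way to see the effect of the new pattern: the trailing (\$[^\s]+)? group, together with dropping the \b anchors, keeps a $! or $cache: suffix attached to the matched URL, whereas the old pattern would stop the match at the host or path. The sample line is made up:

```python
# Quick check of the updated url_pattern: a "$!" suffix stays part of the match.
# The sample line is made up.
import re

url_pattern = r"((https?):\/\/)?(\[[0-9a-fA-F:]+\]|([\w-]+\.)+[\w-]+)(:[0-9]{1,5})?(\/[^\s]*)?(\$[^\s]+)?"

text = "央视,http://example.com$!whitelist"
match = re.search(url_pattern, text)
print(match.group(0) if match else None)
# http://example.com$!whitelist   (the previous pattern stopped at example.com)
```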
34 changes: 23 additions & 11 deletions utils/tools.py
@@ -122,13 +122,20 @@ def get_total_urls_from_info_list(infoList, ipv6=False):
origin: {"ipv4": [], "ipv6": []} for origin in origin_type_prefer
}

total_urls = []
for url, _, resolution, origin in infoList:
if origin == "important":
pure_url, _, info = url.partition("$")
new_info = info.partition("!")[2]
total_urls.append(f"{pure_url}${new_info}" if new_info else pure_url)
continue

if constants.open_filter_resolution and resolution:
resolution_value = get_resolution_value(resolution)
if resolution_value < constants.min_resolution_value:
continue

if not origin or (origin.lower() not in origin_type_prefer):
if not origin or (origin not in origin_type_prefer):
continue

if origin == "subscribe" and "/rtp/" in url:
Expand All @@ -142,7 +149,7 @@ def get_total_urls_from_info_list(infoList, ipv6=False):
categorized_urls[origin]["ipv6"].append(url)
else:
categorized_urls[origin]["ipv4"].append(url)
total_urls = []

ipv_num = {
"ipv4": 0,
"ipv6": 0,
@@ -380,32 +387,37 @@ def get_result_file_content(show_result=False):
)


def remove_duplicates_from_tuple_list(tuple_list, seen, flag=None):
def remove_duplicates_from_tuple_list(tuple_list, seen, flag=None, force_str=None):
"""
Remove duplicates from tuple list
"""
unique_list = []
for item in tuple_list:
if flag:
matcher = re.search(flag, item[0])
part = matcher.group(1) if matcher else item[0]
else:
part = item[0]
item_first = item[0]
part = item_first
if force_str:
info = item_first.partition("$")[2]
if info and info.startswith(force_str):
continue
elif flag:
matcher = re.search(flag, item_first)
if matcher:
part = matcher.group(1)
if part not in seen:
seen.add(part)
unique_list.append(item)
return unique_list


def process_nested_dict(data, seen, flag=None):
def process_nested_dict(data, seen, flag=None, force_str=None):
"""
Process nested dict
"""
for key, value in data.items():
if isinstance(value, dict):
process_nested_dict(value, seen, flag)
process_nested_dict(value, seen, flag, force_str)
elif isinstance(value, list):
data[key] = remove_duplicates_from_tuple_list(value, seen, flag)
data[key] = remove_duplicates_from_tuple_list(value, seen, flag, force_str)
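As written, force_str takes precedence over flag in the updated helper: when it is set, entries whose $ suffix starts with that string are dropped from the working copy entirely (they will not be speed-tested), and deduplication then happens on the full URL rather than the captured cache: key. A self-contained sketch with made-up data:

```python
# Self-contained sketch of the updated dedup helper: with force_str set,
# "$!" entries are skipped and the flag regex is not applied. Data is made up.
import re

def dedup(tuple_list, seen, flag=None, force_str=None):
    unique = []
    for item in tuple_list:
        first = item[0]
        part = first
        if force_str:
            if first.partition("$")[2].startswith(force_str):
                continue  # whitelist entry: excluded from the speed-test working copy
        elif flag:
            matcher = re.search(flag, first)
            if matcher:
                part = matcher.group(1)
        if part not in seen:
            seen.add(part)
            unique.append(item)
    return unique

items = [
    ("http://example.com/a.m3u8$!", None, None, "important"),
    ("http://example.com/b.m3u8$cache:key1", None, None, None),
    ("http://example.com/b.m3u8$cache:key1", None, None, None),  # exact duplicate
]
print([i[0] for i in dedup(items, seen=set(), flag=r"cache:(.*)", force_str="!")])
# ['http://example.com/b.m3u8$cache:key1']
```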


url_domain_pattern = re.compile(
