From dcd5f7996e94644a2b77b6867b04b3b1b9cd00e6 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?=E2=80=98dalvqw=E2=80=99?= <‘1297762043@qq.com’>
Date: Sun, 14 May 2023 12:51:33 +0800
Subject: [PATCH 1/4] =?UTF-8?q?=E5=A2=9E=E5=8A=A0=E6=89=B9=E9=87=8F?=
 =?UTF-8?q?=E6=80=BB=E7=BB=93=E9=9F=B3=E8=A7=86=E9=A2=91=E7=9A=84=E5=8A=9F?=
 =?UTF-8?q?=E8=83=BD?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 crazy_functional.py            |  10 +++
 crazy_functions/crazy_utils.py |  37 +++++++++
 crazy_functions/总结音视频.py  | 138 +++++++++++++++++++++++++++++++++
 3 files changed, 185 insertions(+)
 create mode 100644 crazy_functions/总结音视频.py

diff --git a/crazy_functional.py b/crazy_functional.py
index 3e7b12f..f6b7253 100644
--- a/crazy_functional.py
+++ b/crazy_functional.py
@@ -246,5 +246,15 @@ def get_crazy_functions():
             "Function": HotReload(图片生成)
         },
     })
+    from crazy_functions.总结音视频 import 总结音视频
+    function_plugins.update({
+        "批量总结音视频（输入路径或上传压缩包）": {
+            "Color": "stop",
+            "AsButton": False,
+            "AdvancedArgs": True,
+            "ArgsReminder": "调用openai api 使用whisper-1模型, 目前支持的格式:mp4, m4a, wav, mpga, mpeg, mp3, 此处无需输入参数",
+            "Function": HotReload(总结音视频)
+        }
+    })
     ###################### 第n组插件 ###########################
     return function_plugins
diff --git a/crazy_functions/crazy_utils.py b/crazy_functions/crazy_utils.py
index e54136c..3570ca9 100644
--- a/crazy_functions/crazy_utils.py
+++ b/crazy_functions/crazy_utils.py
@@ -606,3 +606,40 @@ def get_files_from_everything(txt, type): # type='.md'
         success = False
 
     return success, file_manifest, project_folder
+
+
+def split_audio_file(filename, split_duration=1000):
+    """
+    根据给定的切割时长将音频文件切割成多个片段。
+
+    Args:
+        filename (str): 需要被切割的音频文件名。
+        split_duration (int, optional): 每个切割音频片段的时长（以秒为单位）。默认值为1000。
+
+    Returns:
+        filelist (list): 一个包含所有切割音频片段文件路径的列表。
+
+    """
+    from moviepy.editor import AudioFileClip
+    import os
+    os.makedirs('gpt_log/mp3/cut/', exist_ok=True)  # 创建存储切割音频的文件夹
+
+    # 读取音频文件
+    audio = AudioFileClip(filename)
+
+    # 计算文件总时长和切割点
+    total_duration = audio.duration
+    split_points = list(range(0, int(total_duration), split_duration))
+    split_points.append(int(total_duration))
+    filelist = []
+
+    # 切割音频文件
+    for i in range(len(split_points) - 1):
+        start_time = split_points[i]
+        end_time = split_points[i + 1]
+        split_audio = audio.subclip(start_time, end_time)
+        split_audio.write_audiofile(f"gpt_log/mp3/cut/{filename[0]}_{i}.mp3")
+        filelist.append(f"gpt_log/mp3/cut/{filename[0]}_{i}.mp3")
+
+    audio.close()
+    return filelist
\ No newline at end of file
diff --git a/crazy_functions/总结音视频.py b/crazy_functions/总结音视频.py
new file mode 100644
index 0000000..e391061
--- /dev/null
+++ b/crazy_functions/总结音视频.py
@@ -0,0 +1,138 @@
+from toolbox import CatchException, report_execption, select_api_key, update_ui, write_results_to_file
+from .crazy_utils import request_gpt_model_in_new_thread_with_ui_alive, split_audio_file
+
+
+def AnalyAudio(file_manifest, llm_kwargs, chatbot, history):
+    import os, requests
+    from moviepy.editor import AudioFileClip
+    from request_llm.bridge_all import model_info
+
+    # 设置OpenAI密钥和模型
+    api_key = select_api_key(llm_kwargs['api_key'], llm_kwargs['llm_model'])
+    chat_endpoint = model_info[llm_kwargs['llm_model']]['endpoint']
+
+    whisper_endpoint = chat_endpoint.replace('chat/completions', 'audio/transcriptions')
+    url = whisper_endpoint
+    headers = {
+        'Authorization': f"Bearer {api_key}"
+    }
+
+    os.makedirs('gpt_log/mp3/', exist_ok=True)
+    for index, fp in enumerate(file_manifest):
+        audio_history = []
+        # 提取文件扩展名
+        ext = os.path.splitext(fp)[1]
+        # 提取视频中的音频
+        if ext not in [".mp3", ".wav", ".m4a", ".mpga"]:
+            audio_clip = AudioFileClip(fp)
+            audio_clip.write_audiofile(f'gpt_log/mp3/output{index}.mp3')
+            fp = f'gpt_log/mp3/output{index}.mp3'
+        # 调用whisper模型音频转文字
+        voice = split_audio_file(fp)
+        for j, i in enumerate(voice):
+            with open(i, 'rb') as f:
+                file_content = f.read()  # 读取文件内容到内存
+                files = {
+                    'file': (os.path.basename(i), file_content),
+                }
+                data = {
+                    "model": "whisper-1",
+                    'response_format': "text"
+                }
+            response = requests.post(url, headers=headers, files=files, data=data).text
+
+            i_say = f'请对下面的文章片段做概述，文章内容是 ```{response}```'
+            i_say_show_user = f'第{index + 1}段音频的第{j + 1} / {len(voice)}片段。'
+            gpt_say = yield from request_gpt_model_in_new_thread_with_ui_alive(
+                inputs=i_say,
+                inputs_show_user=i_say_show_user,
+                llm_kwargs=llm_kwargs,
+                chatbot=chatbot,
+                history=[],
+                sys_prompt="总结文章。"
+            )
+
+            chatbot[-1] = (i_say_show_user, gpt_say)
+            history.extend([i_say_show_user, gpt_say])
+            audio_history.extend([i_say_show_user, gpt_say])
+
+        # 已经对该文章的所有片段总结完毕，如果文章被切分了，
+        result = "".join(audio_history)
+        if len(audio_history) > 1:
+            i_say = f"根据以上的对话，使用中文总结文章{result}的主要内容。"
+            i_say_show_user = f'第{index + 1}段音频的主要内容：'
+            gpt_say = yield from request_gpt_model_in_new_thread_with_ui_alive(
+                inputs=i_say,
+                inputs_show_user=i_say_show_user,
+                llm_kwargs=llm_kwargs,
+                chatbot=chatbot,
+                history=audio_history,
+                sys_prompt="总结文章。"
+            )
+
+            history.extend([i_say, gpt_say])
+            audio_history.extend([i_say, gpt_say])
+
+        res = write_results_to_file(history)
+        chatbot.append((f"第{index + 1}段音频完成了吗？", res))
+        yield from update_ui(chatbot=chatbot, history=history)  # 刷新界面
+
+    # 删除中间文件夹
+    import shutil
+    shutil.rmtree('gpt_log/mp3')
+    res = write_results_to_file(history)
+    chatbot.append(("所有音频都总结完成了吗？", res))
+    yield from update_ui(chatbot=chatbot, history=history)
+
+
+@CatchException
+def 总结音视频(txt, llm_kwargs, plugin_kwargs, chatbot, history, system_prompt, WEB_PORT):
+    import glob, os
+
+    # 基本信息：功能、贡献者
+    chatbot.append([
+        "函数插件功能？",
+        "总结音视频内容，函数插件贡献者: dalvqw"])
+    yield from update_ui(chatbot=chatbot, history=history)  # 刷新界面
+
+    try:
+        from moviepy.editor import AudioFileClip
+    except:
+        report_execption(chatbot, history,
+                         a=f"解析项目: {txt}",
+                         b=f"导入软件依赖失败。使用该模块需要额外依赖，安装方法```pip install --upgrade moviepy```。")
+        yield from update_ui(chatbot=chatbot, history=history)  # 刷新界面
+        return
+
+    # 清空历史，以免输入溢出
+    history = []
+
+    # 检测输入参数，如没有给定输入参数，直接退出
+    if os.path.exists(txt):
+        project_folder = txt
+    else:
+        if txt == "": txt = '空空如也的输入栏'
+        report_execption(chatbot, history, a=f"解析项目: {txt}", b=f"找不到本地项目或无权访问: {txt}")
+        yield from update_ui(chatbot=chatbot, history=history)  # 刷新界面
+        return
+
+    # 搜索需要处理的文件清单
+    extensions = ['.mp4', '.m4a', '.wav', '.mpga', '.mpeg', '.mp3', '.avi', '.mkv', '.flac', '.aac']
+
+    if txt.endswith(tuple(extensions)):
+        file_manifest = [txt]
+    else:
+        file_manifest = []
+        for extension in extensions:
+            file_manifest.extend(glob.glob(f'{project_folder}/**/*{extension}', recursive=True))
+
+    # 如果没找到任何文件
+    if len(file_manifest) == 0:
+        report_execption(chatbot, history, a=f"解析项目: {txt}", b=f"找不到任何音频或视频文件: {txt}")
+        yield from update_ui(chatbot=chatbot, history=history)  # 刷新界面
+        return
+
+    # 开始正式执行任务
+    yield from AnalyAudio(file_manifest, llm_kwargs, chatbot, history)
+
+    yield from update_ui(chatbot=chatbot, history=history)  # 刷新界面

From d8540d42a6b1e1d63ac284a0c181505a207a7c4f Mon Sep 17 00:00:00 2001
From: binary-husky <505030475@qq.com>
Date: Fri, 19 May 2023 11:22:25 +0800
Subject: [PATCH 2/4] move dep

---
 crazy_functions/crazy_utils.py | 37 ----------------------------------
 crazy_functions/总结音视频.py  | 37 +++++++++++++++++++++++++++++++++-
 2 files changed, 36 insertions(+), 38 deletions(-)

diff --git a/crazy_functions/crazy_utils.py b/crazy_functions/crazy_utils.py
index 3570ca9..e54136c 100644
--- a/crazy_functions/crazy_utils.py
+++ b/crazy_functions/crazy_utils.py
@@ -606,40 +606,3 @@ def get_files_from_everything(txt, type): # type='.md'
         success = False
 
     return success, file_manifest, project_folder
-
-
-def split_audio_file(filename, split_duration=1000):
-    """
-    根据给定的切割时长将音频文件切割成多个片段。
-
-    Args:
-        filename (str): 需要被切割的音频文件名。
-        split_duration (int, optional): 每个切割音频片段的时长（以秒为单位）。默认值为1000。
-
-    Returns:
-        filelist (list): 一个包含所有切割音频片段文件路径的列表。
-
-    """
-    from moviepy.editor import AudioFileClip
-    import os
-    os.makedirs('gpt_log/mp3/cut/', exist_ok=True)  # 创建存储切割音频的文件夹
-
-    # 读取音频文件
-    audio = AudioFileClip(filename)
-
-    # 计算文件总时长和切割点
-    total_duration = audio.duration
-    split_points = list(range(0, int(total_duration), split_duration))
-    split_points.append(int(total_duration))
-    filelist = []
-
-    # 切割音频文件
-    for i in range(len(split_points) - 1):
-        start_time = split_points[i]
-        end_time = split_points[i + 1]
-        split_audio = audio.subclip(start_time, end_time)
-        split_audio.write_audiofile(f"gpt_log/mp3/cut/{filename[0]}_{i}.mp3")
-        filelist.append(f"gpt_log/mp3/cut/{filename[0]}_{i}.mp3")
-
-    audio.close()
-    return filelist
\ No newline at end of file
diff --git a/crazy_functions/总结音视频.py b/crazy_functions/总结音视频.py
index e391061..5e4f884 100644
--- a/crazy_functions/总结音视频.py
+++ b/crazy_functions/总结音视频.py
@@ -1,6 +1,41 @@
 from toolbox import CatchException, report_execption, select_api_key, update_ui, write_results_to_file
-from .crazy_utils import request_gpt_model_in_new_thread_with_ui_alive, split_audio_file
+from .crazy_utils import request_gpt_model_in_new_thread_with_ui_alive
 
+def split_audio_file(filename, split_duration=1000):
+    """
+    Split an audio file into consecutive mp3 segments of at most `split_duration` seconds.
+
+    Args:
+        filename (str): Path of the audio file to split.
+        split_duration (int, optional): Length of each segment in seconds. Defaults to 1000.
+
+    Returns:
+        filelist (list): Paths of the segments written under gpt_log/mp3/cut/, in order.
+    """
+    from moviepy.editor import AudioFileClip
+    import os
+    os.makedirs('gpt_log/mp3/cut/', exist_ok=True)  # folder that receives the segments
+
+    # Name segments after the file's stem; filename[0] is just the first character of the path.
+    stem = os.path.splitext(os.path.basename(filename))[0]
+    audio = AudioFileClip(filename)
+
+    # Cut points every split_duration seconds, closed by the total duration truncated to whole seconds
+    total_duration = audio.duration
+    split_points = list(range(0, int(total_duration), split_duration))
+    split_points.append(int(total_duration))
+    filelist = []
+
+    # Write each consecutive window between two cut points to its own mp3
+    for i in range(len(split_points) - 1):
+        start_time = split_points[i]
+        end_time = split_points[i + 1]
+        split_audio = audio.subclip(start_time, end_time)
+        split_audio.write_audiofile(f"gpt_log/mp3/cut/{stem}_{i}.mp3")
+        filelist.append(f"gpt_log/mp3/cut/{stem}_{i}.mp3")
+
+    audio.close()
+    return filelist
 
 def AnalyAudio(file_manifest, llm_kwargs, chatbot, history):
     import os, requests

From c46a8d27e698d95e741e29abee3f9b03c498c68a Mon Sep 17 00:00:00 2001
From: binary-husky <505030475@qq.com>
Date: Fri, 19 May 2023 12:23:01 +0800
Subject: [PATCH 3/4] =?UTF-8?q?=E4=BF=AE=E6=AD=A3=E5=8F=82=E6=95=B0?=
 =?UTF-8?q?=E9=BB=98=E8=AE=A4=E5=80=BCbug?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 crazy_functions/图片生成.py            | 1 +
 crazy_functions/解析JupyterNotebook.py | 1 +
 crazy_functions/询问多个大语言模型.py  | 1 +
 3 files changed, 3 insertions(+)

diff --git a/crazy_functions/图片生成.py b/crazy_functions/图片生成.py
index ecb75cd..5bf8bc4 100644
--- a/crazy_functions/图片生成.py
+++ b/crazy_functions/图片生成.py
@@ -55,6 +55,7 @@ def 图片生成(prompt, llm_kwargs, plugin_kwargs, chatbot, history, system_pro
     history = []    # 清空历史，以免输入溢出
     chatbot.append(("这是什么功能？", "[Local Message] 生成图像, 请先把模型切换至gpt-xxxx或者api2d-xxxx。如果中文效果不理想, 尝试Prompt。正在处理中 ....."))
     yield from update_ui(chatbot=chatbot, history=history) # 刷新界面 # 由于请求gpt需要一段时间，我们先及时地做一次界面更新
+    if ("advanced_arg" in plugin_kwargs) and (plugin_kwargs["advanced_arg"] == ""): plugin_kwargs.pop("advanced_arg")
     resolution = plugin_kwargs.get("advanced_arg", '256x256')
     image_url, image_path = gen_image(llm_kwargs, prompt, resolution)
     chatbot.append([prompt,  
diff --git a/crazy_functions/解析JupyterNotebook.py b/crazy_functions/解析JupyterNotebook.py
index 95a3d69..b4bcd56 100644
--- a/crazy_functions/解析JupyterNotebook.py
+++ b/crazy_functions/解析JupyterNotebook.py
@@ -67,6 +67,7 @@ def parseNotebook(filename, enable_markdown=1):
 def ipynb解释(file_manifest, project_folder, llm_kwargs, plugin_kwargs, chatbot, history, system_prompt):
     from .crazy_utils import request_gpt_model_multi_threads_with_very_awesome_ui_and_high_efficiency
 
+    if ("advanced_arg" in plugin_kwargs) and (plugin_kwargs["advanced_arg"] == ""): plugin_kwargs.pop("advanced_arg")
     enable_markdown = plugin_kwargs.get("advanced_arg", "1")
     try:
         enable_markdown = int(enable_markdown)
diff --git a/crazy_functions/询问多个大语言模型.py b/crazy_functions/询问多个大语言模型.py
index 2939d04..ec9fd4a 100644
--- a/crazy_functions/询问多个大语言模型.py
+++ b/crazy_functions/询问多个大语言模型.py
@@ -45,6 +45,7 @@ def 同时问询_指定模型(txt, llm_kwargs, plugin_kwargs, chatbot, history,
     chatbot.append((txt, "正在同时咨询ChatGPT和ChatGLM……"))
     yield from update_ui(chatbot=chatbot, history=history) # 刷新界面 # 由于请求gpt需要一段时间，我们先及时地做一次界面更新
 
+    if ("advanced_arg" in plugin_kwargs) and (plugin_kwargs["advanced_arg"] == ""): plugin_kwargs.pop("advanced_arg")
     # llm_kwargs['llm_model'] = 'chatglm&gpt-3.5-turbo&api2d-gpt-3.5-turbo' # 支持任意数量的llm接口，用&符号分隔
     llm_kwargs['llm_model'] = plugin_kwargs.get("advanced_arg", 'chatglm&gpt-3.5-turbo') # 'chatglm&gpt-3.5-turbo' # 支持任意数量的llm接口，用&符号分隔
     gpt_say = yield from request_gpt_model_in_new_thread_with_ui_alive(

From 7d8338ce70388fcbe5677b7ea6ba20cbc2421f82 Mon Sep 17 00:00:00 2001
From: binary-husky <505030475@qq.com>
Date: Fri, 19 May 2023 12:24:04 +0800
Subject: [PATCH 4/4] =?UTF-8?q?=E5=85=81=E8=AE=B8=E9=9F=B3=E9=A2=91?=
 =?UTF-8?q?=E8=BD=AC=E6=96=87=E5=AD=97=E6=97=B6=E7=9A=84=E9=AB=98=E7=BA=A7?=
 =?UTF-8?q?=E5=8F=82=E6=95=B0=E6=8C=87=E4=BB=A4?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 crazy_functional.py           |  2 +-
 crazy_functions/总结音视频.py | 29 ++++++++++++++++++++---------
 2 files changed, 21 insertions(+), 10 deletions(-)

diff --git a/crazy_functional.py b/crazy_functional.py
index f6b7253..462000e 100644
--- a/crazy_functional.py
+++ b/crazy_functional.py
@@ -252,7 +252,7 @@ def get_crazy_functions():
             "Color": "stop",
             "AsButton": False,
             "AdvancedArgs": True,
-            "ArgsReminder": "调用openai api 使用whisper-1模型, 目前支持的格式:mp4, m4a, wav, mpga, mpeg, mp3, 此处无需输入参数",
+            "ArgsReminder": "调用openai api 使用whisper-1模型, 目前支持的格式:mp4, m4a, wav, mpga, mpeg, mp3。此处可以输入解析提示，例如：解析为简体中文（默认）。",
             "Function": HotReload(总结音视频)
         }
     })
diff --git a/crazy_functions/总结音视频.py b/crazy_functions/总结音视频.py
index 5e4f884..62f05d3 100644
--- a/crazy_functions/总结音视频.py
+++ b/crazy_functions/总结音视频.py
@@ -1,4 +1,4 @@
-from toolbox import CatchException, report_execption, select_api_key, update_ui, write_results_to_file
+from toolbox import CatchException, report_execption, select_api_key, update_ui, write_results_to_file, get_conf
 from .crazy_utils import request_gpt_model_in_new_thread_with_ui_alive
 
 def split_audio_file(filename, split_duration=1000):
@@ -37,7 +37,7 @@ def split_audio_file(filename, split_duration=1000):
     audio.close()
     return filelist
 
-def AnalyAudio(file_manifest, llm_kwargs, chatbot, history):
+def AnalyAudio(parse_prompt, file_manifest, llm_kwargs, chatbot, history):
     import os, requests
     from moviepy.editor import AudioFileClip
     from request_llm.bridge_all import model_info
@@ -72,11 +72,20 @@ def AnalyAudio(file_manifest, llm_kwargs, chatbot, history):
                 }
                 data = {
                     "model": "whisper-1",
+                    "prompt": parse_prompt,
                     'response_format': "text"
                 }
-            response = requests.post(url, headers=headers, files=files, data=data).text
 
-            i_say = f'请对下面的文章片段做概述，文章内容是 ```{response}```'
+            chatbot.append([f"将 {i} 发送到openai音频解析终端 (whisper)，当前参数：{parse_prompt}", "正在处理 ..."])
+            yield from update_ui(chatbot=chatbot, history=history)  # 刷新界面
+            proxies, = get_conf('proxies')
+            response = requests.post(url, headers=headers, files=files, data=data, proxies=proxies).text
+
+            chatbot.append(["音频解析结果", response])
+            history.extend(["音频解析结果", response])
+            yield from update_ui(chatbot=chatbot, history=history)  # 刷新界面
+
+            i_say = f'请对下面的音频片段做概述，音频内容是 ```{response}```'
             i_say_show_user = f'第{index + 1}段音频的第{j + 1} / {len(voice)}片段。'
             gpt_say = yield from request_gpt_model_in_new_thread_with_ui_alive(
                 inputs=i_say,
@@ -84,17 +93,17 @@ def AnalyAudio(file_manifest, llm_kwargs, chatbot, history):
                 llm_kwargs=llm_kwargs,
                 chatbot=chatbot,
                 history=[],
-                sys_prompt="总结文章。"
+                sys_prompt=f"总结音频。音频文件名{fp}"
             )
 
             chatbot[-1] = (i_say_show_user, gpt_say)
             history.extend([i_say_show_user, gpt_say])
             audio_history.extend([i_say_show_user, gpt_say])
 
-        # 已经对该文章的所有片段总结完毕，如果文章被切分了，
+        # 已经对该文章的所有片段总结完毕，如果文章被切分了
         result = "".join(audio_history)
         if len(audio_history) > 1:
-            i_say = f"根据以上的对话，使用中文总结文章{result}的主要内容。"
+            i_say = f"根据以上的对话，使用中文总结音频“{result}”的主要内容。"
             i_say_show_user = f'第{index + 1}段音频的主要内容：'
             gpt_say = yield from request_gpt_model_in_new_thread_with_ui_alive(
                 inputs=i_say,
@@ -127,7 +136,7 @@ def 总结音视频(txt, llm_kwargs, plugin_kwargs, chatbot, history, system_pro
     # 基本信息：功能、贡献者
     chatbot.append([
         "函数插件功能？",
-        "总结音视频内容，函数插件贡献者: dalvqw"])
+        "总结音视频内容，函数插件贡献者: dalvqw & BinaryHusky"])
     yield from update_ui(chatbot=chatbot, history=history)  # 刷新界面
 
     try:
@@ -168,6 +177,8 @@ def 总结音视频(txt, llm_kwargs, plugin_kwargs, chatbot, history, system_pro
         return
 
     # 开始正式执行任务
-    yield from AnalyAudio(file_manifest, llm_kwargs, chatbot, history)
+    if ("advanced_arg" in plugin_kwargs) and (plugin_kwargs["advanced_arg"] == ""): plugin_kwargs.pop("advanced_arg")
+    parse_prompt = plugin_kwargs.get("advanced_arg", '将音频解析为简体中文')
+    yield from AnalyAudio(parse_prompt, file_manifest, llm_kwargs, chatbot, history)
 
     yield from update_ui(chatbot=chatbot, history=history)  # 刷新界面