608 lines
20 KiB
Python
608 lines
20 KiB
Python
"""
|
||
Main.py
|
||
"""
|
||
|
||
from transformers import AutoModel, AutoTokenizer
|
||
import time
|
||
import importlib
|
||
from toolbox import update_ui, get_conf
|
||
from multiprocessing import Process, Pipe
|
||
import argparse
|
||
import asyncio
|
||
import json
|
||
import os
|
||
import random
|
||
import re
|
||
import ssl
|
||
import sys
|
||
import uuid
|
||
from enum import Enum
|
||
from pathlib import Path
|
||
from typing import Generator
|
||
from typing import Literal
|
||
from typing import Optional
|
||
from typing import Union
|
||
import certifi
|
||
import httpx
|
||
import websockets.client as websockets
|
||
from prompt_toolkit import PromptSession
|
||
from prompt_toolkit.auto_suggest import AutoSuggestFromHistory
|
||
from prompt_toolkit.completion import WordCompleter
|
||
from prompt_toolkit.history import InMemoryHistory
|
||
from prompt_toolkit.key_binding import KeyBindings
|
||
from rich.live import Live
|
||
from rich.markdown import Markdown
|
||
|
||
DELIMITER = "\x1e"
|
||
|
||
|
||
# Generate random IP between range 13.104.0.0/14
|
||
FORWARDED_IP = (
|
||
f"13.{random.randint(104, 107)}.{random.randint(0, 255)}.{random.randint(0, 255)}"
|
||
)
|
||
|
||
HEADERS = {
|
||
"accept": "application/json",
|
||
"accept-language": "en-US,en;q=0.9",
|
||
"content-type": "application/json",
|
||
"sec-ch-ua": '"Not_A Brand";v="99", "Microsoft Edge";v="110", "Chromium";v="110"',
|
||
"sec-ch-ua-arch": '"x86"',
|
||
"sec-ch-ua-bitness": '"64"',
|
||
"sec-ch-ua-full-version": '"109.0.1518.78"',
|
||
"sec-ch-ua-full-version-list": '"Chromium";v="110.0.5481.192", "Not A(Brand";v="24.0.0.0", "Microsoft Edge";v="110.0.1587.69"',
|
||
"sec-ch-ua-mobile": "?0",
|
||
"sec-ch-ua-model": "",
|
||
"sec-ch-ua-platform": '"Windows"',
|
||
"sec-ch-ua-platform-version": '"15.0.0"',
|
||
"sec-fetch-dest": "empty",
|
||
"sec-fetch-mode": "cors",
|
||
"sec-fetch-site": "same-origin",
|
||
"x-ms-client-request-id": str(uuid.uuid4()),
|
||
"x-ms-useragent": "azsdk-js-api-client-factory/1.0.0-beta.1 core-rest-pipeline/1.10.0 OS/Win32",
|
||
"Referer": "https://www.bing.com/search?q=Bing+AI&showconv=1&FORM=hpcodx",
|
||
"Referrer-Policy": "origin-when-cross-origin",
|
||
"x-forwarded-for": FORWARDED_IP,
|
||
}
|
||
|
||
HEADERS_INIT_CONVER = {
|
||
"authority": "edgeservices.bing.com",
|
||
"accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.7",
|
||
"accept-language": "en-US,en;q=0.9",
|
||
"cache-control": "max-age=0",
|
||
"sec-ch-ua": '"Chromium";v="110", "Not A(Brand";v="24", "Microsoft Edge";v="110"',
|
||
"sec-ch-ua-arch": '"x86"',
|
||
"sec-ch-ua-bitness": '"64"',
|
||
"sec-ch-ua-full-version": '"110.0.1587.69"',
|
||
"sec-ch-ua-full-version-list": '"Chromium";v="110.0.5481.192", "Not A(Brand";v="24.0.0.0", "Microsoft Edge";v="110.0.1587.69"',
|
||
"sec-ch-ua-mobile": "?0",
|
||
"sec-ch-ua-model": '""',
|
||
"sec-ch-ua-platform": '"Windows"',
|
||
"sec-ch-ua-platform-version": '"15.0.0"',
|
||
"sec-fetch-dest": "document",
|
||
"sec-fetch-mode": "navigate",
|
||
"sec-fetch-site": "none",
|
||
"sec-fetch-user": "?1",
|
||
"upgrade-insecure-requests": "1",
|
||
"user-agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/110.0.0.0 Safari/537.36 Edg/110.0.1587.69",
|
||
"x-edge-shopping-flag": "1",
|
||
"x-forwarded-for": FORWARDED_IP,
|
||
}
|
||
|
||
ssl_context = ssl.create_default_context()
|
||
ssl_context.load_verify_locations(certifi.where())
|
||
|
||
|
||
class NotAllowedToAccess(Exception):
|
||
pass
|
||
|
||
|
||
class ConversationStyle(Enum):
|
||
creative = "h3imaginative,clgalileo,gencontentv3"
|
||
balanced = "galileo"
|
||
precise = "h3precise,clgalileo"
|
||
|
||
|
||
CONVERSATION_STYLE_TYPE = Optional[
|
||
Union[ConversationStyle, Literal["creative", "balanced", "precise"]]
|
||
]
|
||
|
||
|
||
def _append_identifier(msg: dict) -> str:
|
||
"""
|
||
Appends special character to end of message to identify end of message
|
||
"""
|
||
# Convert dict to json string
|
||
return json.dumps(msg) + DELIMITER
|
||
|
||
|
||
def _get_ran_hex(length: int = 32) -> str:
|
||
"""
|
||
Returns random hex string
|
||
"""
|
||
return "".join(random.choice("0123456789abcdef") for _ in range(length))
|
||
|
||
|
||
class _ChatHubRequest:
|
||
"""
|
||
Request object for ChatHub
|
||
"""
|
||
|
||
def __init__(
|
||
self,
|
||
conversation_signature: str,
|
||
client_id: str,
|
||
conversation_id: str,
|
||
invocation_id: int = 0,
|
||
) -> None:
|
||
self.struct: dict = {}
|
||
|
||
self.client_id: str = client_id
|
||
self.conversation_id: str = conversation_id
|
||
self.conversation_signature: str = conversation_signature
|
||
self.invocation_id: int = invocation_id
|
||
|
||
def update(
|
||
self,
|
||
prompt: str,
|
||
conversation_style: CONVERSATION_STYLE_TYPE,
|
||
options: list | None = None,
|
||
) -> None:
|
||
"""
|
||
Updates request object
|
||
"""
|
||
if options is None:
|
||
options = [
|
||
"deepleo",
|
||
"enable_debug_commands",
|
||
"disable_emoji_spoken_text",
|
||
"enablemm",
|
||
]
|
||
if conversation_style:
|
||
if not isinstance(conversation_style, ConversationStyle):
|
||
conversation_style = getattr(ConversationStyle, conversation_style)
|
||
options = [
|
||
"nlu_direct_response_filter",
|
||
"deepleo",
|
||
"disable_emoji_spoken_text",
|
||
"responsible_ai_policy_235",
|
||
"enablemm",
|
||
conversation_style.value,
|
||
"dtappid",
|
||
"cricinfo",
|
||
"cricinfov2",
|
||
"dv3sugg",
|
||
]
|
||
self.struct = {
|
||
"arguments": [
|
||
{
|
||
"source": "cib",
|
||
"optionsSets": options,
|
||
"sliceIds": [
|
||
"222dtappid",
|
||
"225cricinfo",
|
||
"224locals0",
|
||
],
|
||
"traceId": _get_ran_hex(32),
|
||
"isStartOfSession": self.invocation_id == 0,
|
||
"message": {
|
||
"author": "user",
|
||
"inputMethod": "Keyboard",
|
||
"text": prompt,
|
||
"messageType": "Chat",
|
||
},
|
||
"conversationSignature": self.conversation_signature,
|
||
"participant": {
|
||
"id": self.client_id,
|
||
},
|
||
"conversationId": self.conversation_id,
|
||
},
|
||
],
|
||
"invocationId": str(self.invocation_id),
|
||
"target": "chat",
|
||
"type": 4,
|
||
}
|
||
self.invocation_id += 1
|
||
|
||
|
||
class _Conversation:
|
||
"""
|
||
Conversation API
|
||
"""
|
||
|
||
def __init__(
|
||
self,
|
||
cookies: dict,
|
||
proxy: str | None = None,
|
||
) -> None:
|
||
self.struct: dict = {
|
||
"conversationId": None,
|
||
"clientId": None,
|
||
"conversationSignature": None,
|
||
"result": {"value": "Success", "message": None},
|
||
}
|
||
self.proxy = proxy
|
||
proxy = (
|
||
proxy
|
||
or os.environ.get("all_proxy")
|
||
or os.environ.get("ALL_PROXY")
|
||
or os.environ.get("https_proxy")
|
||
or os.environ.get("HTTPS_PROXY")
|
||
or None
|
||
)
|
||
if proxy is not None and proxy.startswith("socks5h://"):
|
||
proxy = "socks5://" + proxy[len("socks5h://") :]
|
||
self.session = httpx.Client(
|
||
proxies=proxy,
|
||
timeout=30,
|
||
headers=HEADERS_INIT_CONVER,
|
||
)
|
||
for cookie in cookies:
|
||
self.session.cookies.set(cookie["name"], cookie["value"])
|
||
|
||
# Send GET request
|
||
response = self.session.get(
|
||
url=os.environ.get("BING_PROXY_URL")
|
||
or "https://edgeservices.bing.com/edgesvc/turing/conversation/create",
|
||
)
|
||
if response.status_code != 200:
|
||
response = self.session.get(
|
||
"https://edge.churchless.tech/edgesvc/turing/conversation/create",
|
||
)
|
||
if response.status_code != 200:
|
||
print(f"Status code: {response.status_code}")
|
||
print(response.text)
|
||
print(response.url)
|
||
raise Exception("Authentication failed")
|
||
try:
|
||
self.struct = response.json()
|
||
except (json.decoder.JSONDecodeError, NotAllowedToAccess) as exc:
|
||
raise Exception(
|
||
"Authentication failed. You have not been accepted into the beta.",
|
||
) from exc
|
||
if self.struct["result"]["value"] == "UnauthorizedRequest":
|
||
raise NotAllowedToAccess(self.struct["result"]["message"])
|
||
|
||
|
||
class _ChatHub:
|
||
"""
|
||
Chat API
|
||
"""
|
||
|
||
def __init__(self, conversation: _Conversation) -> None:
|
||
self.wss: websockets.WebSocketClientProtocol | None = None
|
||
self.request: _ChatHubRequest
|
||
self.loop: bool
|
||
self.task: asyncio.Task
|
||
self.request = _ChatHubRequest(
|
||
conversation_signature=conversation.struct["conversationSignature"],
|
||
client_id=conversation.struct["clientId"],
|
||
conversation_id=conversation.struct["conversationId"],
|
||
)
|
||
|
||
async def ask_stream(
|
||
self,
|
||
prompt: str,
|
||
wss_link: str,
|
||
conversation_style: CONVERSATION_STYLE_TYPE = None,
|
||
raw: bool = False,
|
||
options: dict = None,
|
||
) -> Generator[str, None, None]:
|
||
"""
|
||
Ask a question to the bot
|
||
"""
|
||
if self.wss and not self.wss.closed:
|
||
await self.wss.close()
|
||
# Check if websocket is closed
|
||
self.wss = await websockets.connect(
|
||
wss_link,
|
||
extra_headers=HEADERS,
|
||
max_size=None,
|
||
ssl=ssl_context,
|
||
)
|
||
await self._initial_handshake()
|
||
# Construct a ChatHub request
|
||
self.request.update(
|
||
prompt=prompt,
|
||
conversation_style=conversation_style,
|
||
options=options,
|
||
)
|
||
# Send request
|
||
await self.wss.send(_append_identifier(self.request.struct))
|
||
final = False
|
||
while not final:
|
||
objects = str(await self.wss.recv()).split(DELIMITER)
|
||
for obj in objects:
|
||
if obj is None or not obj:
|
||
continue
|
||
response = json.loads(obj)
|
||
if response.get("type") != 2 and raw:
|
||
yield False, response
|
||
elif response.get("type") == 1 and response["arguments"][0].get(
|
||
"messages",
|
||
):
|
||
resp_txt = response["arguments"][0]["messages"][0]["adaptiveCards"][
|
||
0
|
||
]["body"][0].get("text")
|
||
yield False, resp_txt
|
||
elif response.get("type") == 2:
|
||
final = True
|
||
yield True, response
|
||
|
||
async def _initial_handshake(self) -> None:
|
||
await self.wss.send(_append_identifier({"protocol": "json", "version": 1}))
|
||
await self.wss.recv()
|
||
|
||
async def close(self) -> None:
|
||
"""
|
||
Close the connection
|
||
"""
|
||
if self.wss and not self.wss.closed:
|
||
await self.wss.close()
|
||
|
||
|
||
class Chatbot:
|
||
"""
|
||
Combines everything to make it seamless
|
||
"""
|
||
|
||
def __init__(
|
||
self,
|
||
cookies: dict = None,
|
||
proxy: str | None = None,
|
||
cookie_path: str = None,
|
||
) -> None:
|
||
if cookies is None:
|
||
cookies = {}
|
||
if cookie_path is not None:
|
||
try:
|
||
with open(cookie_path, encoding="utf-8") as f:
|
||
self.cookies = json.load(f)
|
||
except FileNotFoundError as exc:
|
||
raise FileNotFoundError("Cookie file not found") from exc
|
||
else:
|
||
self.cookies = cookies
|
||
self.proxy: str | None = proxy
|
||
self.chat_hub: _ChatHub = _ChatHub(
|
||
_Conversation(self.cookies, self.proxy),
|
||
)
|
||
|
||
async def ask(
|
||
self,
|
||
prompt: str,
|
||
wss_link: str = "wss://sydney.bing.com/sydney/ChatHub",
|
||
conversation_style: CONVERSATION_STYLE_TYPE = None,
|
||
options: dict = None,
|
||
) -> dict:
|
||
"""
|
||
Ask a question to the bot
|
||
"""
|
||
async for final, response in self.chat_hub.ask_stream(
|
||
prompt=prompt,
|
||
conversation_style=conversation_style,
|
||
wss_link=wss_link,
|
||
options=options,
|
||
):
|
||
if final:
|
||
return response
|
||
await self.chat_hub.wss.close()
|
||
return None
|
||
|
||
async def ask_stream(
|
||
self,
|
||
prompt: str,
|
||
wss_link: str = "wss://sydney.bing.com/sydney/ChatHub",
|
||
conversation_style: CONVERSATION_STYLE_TYPE = None,
|
||
raw: bool = False,
|
||
options: dict = None,
|
||
) -> Generator[str, None, None]:
|
||
"""
|
||
Ask a question to the bot
|
||
"""
|
||
async for response in self.chat_hub.ask_stream(
|
||
prompt=prompt,
|
||
conversation_style=conversation_style,
|
||
wss_link=wss_link,
|
||
raw=raw,
|
||
options=options,
|
||
):
|
||
yield response
|
||
|
||
async def close(self) -> None:
|
||
"""
|
||
Close the connection
|
||
"""
|
||
await self.chat_hub.close()
|
||
|
||
async def reset(self) -> None:
|
||
"""
|
||
Reset the conversation
|
||
"""
|
||
await self.close()
|
||
self.chat_hub = _ChatHub(_Conversation(self.cookies))
|
||
|
||
|
||
async def _get_input_async(
|
||
session: PromptSession = None,
|
||
completer: WordCompleter = None,
|
||
) -> str:
|
||
"""
|
||
Multiline input function.
|
||
"""
|
||
return await session.prompt_async(
|
||
completer=completer,
|
||
multiline=True,
|
||
auto_suggest=AutoSuggestFromHistory(),
|
||
)
|
||
|
||
|
||
def _create_session() -> PromptSession:
|
||
kb = KeyBindings()
|
||
|
||
@kb.add("enter")
|
||
def _(event):
|
||
buffer_text = event.current_buffer.text
|
||
if buffer_text.startswith("!"):
|
||
event.current_buffer.validate_and_handle()
|
||
else:
|
||
event.current_buffer.insert_text("\n")
|
||
|
||
@kb.add("escape")
|
||
def _(event):
|
||
if event.current_buffer.complete_state:
|
||
# event.current_buffer.cancel_completion()
|
||
event.current_buffer.text = ""
|
||
|
||
return PromptSession(key_bindings=kb, history=InMemoryHistory())
|
||
|
||
|
||
def _create_completer(commands: list, pattern_str: str = "$"):
|
||
return WordCompleter(words=commands, pattern=re.compile(pattern_str))
|
||
|
||
|
||
load_message = ""
|
||
|
||
#################################################################################
|
||
#################################################################################
|
||
#################################################################################
|
||
#################################################################################
|
||
#################################################################################
|
||
#################################################################################
|
||
class GetNewBingHandle(Process):
|
||
def __init__(self):
|
||
super().__init__(daemon=True)
|
||
self.parent, self.child = Pipe()
|
||
self.chatglm_model = None
|
||
self.chatglm_tokenizer = None
|
||
self.info = ""
|
||
self.success = True
|
||
self.check_dependency()
|
||
self.start()
|
||
|
||
def check_dependency(self):
|
||
try:
|
||
import rich
|
||
self.info = "依赖检测通过"
|
||
self.success = True
|
||
except:
|
||
self.info = "缺少的依赖,如果要使用Newbing,除了基础的pip依赖以外,您还需要运行`pip install -r request_llm/requirements_newbing.txt`安装Newbing的依赖。"
|
||
self.success = False
|
||
|
||
def ready(self):
|
||
return self.chatglm_model is not None
|
||
|
||
async def async_run(self, question):
|
||
async for final, response in self.chatglm_model.ask_stream(
|
||
prompt=question,
|
||
conversation_style="balanced", # ["creative", "balanced", "precise"]
|
||
wss_link="wss://sydney.bing.com/sydney/ChatHub", # "wss://sydney.bing.com/sydney/ChatHub"
|
||
):
|
||
if not final:
|
||
self.child.send(response)
|
||
print(response)
|
||
|
||
def run(self):
|
||
# 第一次运行,加载参数
|
||
retry = 0
|
||
while True:
|
||
try:
|
||
if self.chatglm_model is None:
|
||
proxies, = get_conf('proxies')
|
||
newbing_cookies, = get_conf('newbing_cookies')
|
||
cookies = json.loads(newbing_cookies)
|
||
self.chatglm_model = Chatbot(proxy=proxies['https'], cookies=cookies)
|
||
break
|
||
else:
|
||
break
|
||
except:
|
||
retry += 1
|
||
if retry > 3:
|
||
self.child.send('[Local Message] 不能加载Newbing组件。')
|
||
raise RuntimeError("不能加载Newbing组件。")
|
||
|
||
# 进入任务等待状态
|
||
while True:
|
||
kwargs = self.child.recv()
|
||
try:
|
||
asyncio.run(self.async_run(question=kwargs['query']))
|
||
except:
|
||
self.child.send('[Local Message] Newbing失败.')
|
||
self.child.send('[Finish]')
|
||
|
||
def stream_chat(self, **kwargs):
|
||
self.parent.send(kwargs)
|
||
while True:
|
||
res = self.parent.recv()
|
||
if res != '[Finish]':
|
||
yield res
|
||
else:
|
||
break
|
||
return
|
||
|
||
global glm_handle
|
||
glm_handle = None
|
||
#################################################################################
|
||
def predict_no_ui_long_connection(inputs, llm_kwargs, history=[], sys_prompt="", observe_window=None, console_slience=False):
|
||
"""
|
||
多线程方法
|
||
函数的说明请见 request_llm/bridge_all.py
|
||
"""
|
||
global glm_handle
|
||
if glm_handle is None:
|
||
glm_handle = GetNewBingHandle()
|
||
observe_window[0] = load_message + "\n\n" + glm_handle.info
|
||
if not glm_handle.success:
|
||
error = glm_handle.info
|
||
glm_handle = None
|
||
raise RuntimeError(error)
|
||
|
||
# chatglm 没有 sys_prompt 接口,因此把prompt加入 history
|
||
history_feedin = []
|
||
history_feedin.append(["What can I do?", sys_prompt])
|
||
for i in range(len(history)//2):
|
||
history_feedin.append([history[2*i], history[2*i+1]] )
|
||
|
||
watch_dog_patience = 5 # 看门狗 (watchdog) 的耐心, 设置5秒即可
|
||
response = ""
|
||
for response in glm_handle.stream_chat(query=inputs, history=history_feedin, max_length=llm_kwargs['max_length'], top_p=llm_kwargs['top_p'], temperature=llm_kwargs['temperature']):
|
||
observe_window[0] = response
|
||
if len(observe_window) >= 2:
|
||
if (time.time()-observe_window[1]) > watch_dog_patience:
|
||
raise RuntimeError("程序终止。")
|
||
return response
|
||
|
||
|
||
|
||
def predict(inputs, llm_kwargs, plugin_kwargs, chatbot, history=[], system_prompt='', stream = True, additional_fn=None):
|
||
"""
|
||
单线程方法
|
||
函数的说明请见 request_llm/bridge_all.py
|
||
"""
|
||
chatbot.append((inputs, ""))
|
||
|
||
global glm_handle
|
||
if glm_handle is None:
|
||
glm_handle = GetNewBingHandle()
|
||
chatbot[-1] = (inputs, load_message + "\n\n" + glm_handle.info)
|
||
yield from update_ui(chatbot=chatbot, history=[])
|
||
if not glm_handle.success:
|
||
glm_handle = None
|
||
return
|
||
|
||
if additional_fn is not None:
|
||
import core_functional
|
||
importlib.reload(core_functional) # 热更新prompt
|
||
core_functional = core_functional.get_core_functions()
|
||
if "PreProcess" in core_functional[additional_fn]: inputs = core_functional[additional_fn]["PreProcess"](inputs) # 获取预处理函数(如果有的话)
|
||
inputs = core_functional[additional_fn]["Prefix"] + inputs + core_functional[additional_fn]["Suffix"]
|
||
|
||
history_feedin = []
|
||
history_feedin.append(["What can I do?", system_prompt] )
|
||
for i in range(len(history)//2):
|
||
history_feedin.append([history[2*i], history[2*i+1]] )
|
||
|
||
for response in glm_handle.stream_chat(query=inputs, history=history_feedin, max_length=llm_kwargs['max_length'], top_p=llm_kwargs['top_p'], temperature=llm_kwargs['temperature']):
|
||
chatbot[-1] = (inputs, response)
|
||
yield from update_ui(chatbot=chatbot, history=history)
|
||
|
||
history.extend([inputs, response])
|
||
yield from update_ui(chatbot=chatbot, history=history) |