forked from sandboxdream/AI-Vtuber
-
Notifications
You must be signed in to change notification settings - Fork 0
/
ks.py
369 lines (303 loc) · 13.9 KB
/
ks.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
from playwright.sync_api import sync_playwright
import logging, os
import time
import threading
import schedule
import random
import traceback
import asyncio
from functools import partial
from google.protobuf.json_format import MessageToDict
from configparser import ConfigParser
import kuaishou_pb2
from utils.common import Common
from utils.logger import Configure_logger
from utils.my_handle import My_handle
from utils.config import Config
# Shared module-level state. Every name starts out as None and is rebound by
# start_server() before any worker thread is launched.
config = common = my_handle = last_username_list = None
class kslive(object):
    """Listen to one Kuaishou live room through a Playwright-driven Firefox.

    The instance opens the Kuaishou live site, waits for a logged-in session,
    stores the browser storage state under ``<cwd>/cookie/<phone>.json`` and
    then decodes the protobuf frames received on the room's websocket.
    Comment feeds are forwarded to the module-level ``my_handle``; gift and
    like feeds are only logged.
    """

    # Element that appears in the page header once a user is logged in.
    _LOGGED_IN_SELECTOR = (
        "#app > section > div.header-placeholder > header > div.header-main > "
        "div.right-part > div.user-info > div.tooltip-trigger > span"
    )

    # Tip element rendered by the player when the room is not (or no longer) live.
    _OFFLINE_SELECTOR = (
        "html body div#app div.live-room div.detail div.player "
        "div.kwai-player.kwai-player-container.kwai-player-rotation-0 "
        "div.kwai-player-container-video div.kwai-player-plugins div.center-state div.state "
        "div.no-live-detail div.desc p.tip"
    )

    def __init__(self):
        """Initialise paths, browser defaults and the configured room ids.

        Reads ``room_display_id`` from the module-level ``config`` object.

        Raises:
            SystemExit: when the configuration cannot be read (for example
                because ``config`` has not been initialised yet).
        """
        self.path = os.path.abspath('')
        # Relative location of a bundled Firefox; not used by the code in this class.
        self.chrome_path = r"\firefox-1419\firefox\firefox.exe"
        self.ua = 'Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:109.0) Gecko/20100101 Firefox/115.0'
        self.uri = 'https://live.kuaishou.com/u/'
        self.context = None
        self.browser = None
        self.page = None
        try:
            self.live_ids = config.get("room_display_id")
            self.thread = 2
            # Placeholder phone number: it pre-fills the login form and names
            # the saved storage-state file, nothing more.
            self.phone = "123"
        except Exception:
            logging.error(traceback.format_exc())
            logging.error("请检查配置文件")
            # ``exit()`` is injected by the ``site`` module and is not
            # guaranteed to exist; raise SystemExit directly and signal failure.
            raise SystemExit(1)

    def find_file(self, find_path, file_type) -> list:
        """Return the files of a given type located directly inside a sub-folder.

        :param find_path: sub-folder, relative to ``self.path``
        :param file_type: file extension, with or without the leading dot
        :return: full paths of the matching files; an empty list when the
            folder does not exist or holds no match. Sub-directories are not
            searched.
        """
        folder = os.path.join(self.path, find_path)
        suffix = "." + file_type.lstrip(".")
        # os.walk yields the top folder first; only that level is wanted, so
        # return straight from the first iteration.
        for root, _dirs, files in os.walk(folder):
            return [os.path.join(root, name) for name in files if name.endswith(suffix)]
        return []

    def main(self, lid, semaphore):
        """Run one complete listening session for a single room.

        :param lid: room display id, appended to ``self.uri``
        :param semaphore: semaphore limiting how many sessions run at once
        """
        cookie_dir = os.path.join(self.path, "cookie")
        cookie_path = os.path.join(cookie_dir, self.phone + ".json")
        os.makedirs(cookie_dir, exist_ok=True)
        with semaphore:
            # Thread names look like "<label>-<room id>"; keep the label only.
            thread_name = threading.current_thread().name.split("-")[0]
            with sync_playwright() as p:
                self.browser = p.firefox.launch(headless=False)
                try:
                    self._run_session(lid, thread_name, cookie_path)
                finally:
                    # Release the browser on every exit path, including errors
                    # raised before the login wait starts.
                    self._close_browser()

    def _run_session(self, lid, thread_name, cookie_path):
        """Open the site, wait for a logged-in session, then watch the room."""
        # Load exactly the state file this session saves to, instead of
        # whichever JSON file happens to be listed first in the cookie folder.
        saved_state = cookie_path if os.path.exists(cookie_path) else None
        self.context = self.browser.new_context(storage_state=saved_state, user_agent=self.ua)
        self.page = self.context.new_page()
        # Hide navigator.webdriver from the page scripts.
        self.page.add_init_script("Object.defineProperties(navigator, {webdriver:{get:()=>undefined}});")
        self.page.goto("https://live.kuaishou.com/")
        element = self.page.get_attribute('.no-login', "style")
        if not element:
            # Open the login dialog, switch to its second tab and pre-fill the
            # phone number. Presumably the user completes the login by hand
            # while the wait below is pending.
            self.page.locator('.login').click()
            self.page.locator('li.tab-panel:nth-child(2) > h4:nth-child(1)').click()
            self.page.locator(
                'div.normal-login-item:nth-child(1) > div:nth-child(1) > input:nth-child(1)'
            ).fill(self.phone)
        try:
            # Allow up to two minutes for the logged-in header to show up.
            self.page.wait_for_selector(self._LOGGED_IN_SELECTOR, timeout=1000 * 60 * 2)
            os.makedirs(os.path.dirname(cookie_path), exist_ok=True)
            self.context.storage_state(path=cookie_path)
            self._watch_room(lid, thread_name)
        except Exception:
            logging.info("登录失败")
            # The message above is also reached by failures after login, so
            # keep the real cause available for debugging.
            logging.debug(traceback.format_exc())

    def _watch_room(self, lid, thread_name):
        """Open the room page and block until its offline tip is displayed."""
        # NOTE(review): this probe runs before the room page is opened, so it
        # appears to always fall through to the "live" path; confirm whether
        # it was meant to run after navigating to the room.
        try:
            offline_tip = self.page.locator(self._OFFLINE_SELECTOR).text_content(timeout=3000)
        except Exception:
            offline_tip = None
        if offline_tip is not None:
            logging.info("当前%s,%s" % (thread_name, offline_tip))
            return
        logging.info("当前%s,[%s]正在直播" % (thread_name, lid))
        # Subscribe before navigating so that sockets opened while the room
        # page is still loading are not missed.
        self.page.on("websocket", self.web_sockets)
        self.page.goto(self.uri + lid)
        # Block (up to 24 hours) until the offline tip is rendered.
        self.page.wait_for_selector(self._OFFLINE_SELECTOR, timeout=86400000)
        logging.error("当前%s,[%s]的直播结束了" % (thread_name, lid))

    def _close_browser(self):
        """Close the browser context and the browser, tolerating repeated calls."""
        context, browser = self.context, self.browser
        self.context = None
        self.browser = None
        for resource in (context, browser):
            if resource is None:
                continue
            try:
                resource.close()
            except Exception:
                # Closing is best effort: the target may already be gone.
                logging.debug(traceback.format_exc())

    def web_sockets(self, web_socket):
        """Attach frame and close listeners to the room's message websocket."""
        logging.info("web_sockets...")
        urls = web_socket.url
        logging.info(urls)
        if '/websocket' in urls:
            web_socket.on("close", self.websocket_close)
            web_socket.on("framereceived", self.handler)

    def websocket_close(self):
        """Shut the browser down once the message websocket has closed."""
        self._close_browser()

    def handler(self, websocket):
        """Decode one received websocket frame and process the feeds it holds.

        :param websocket: payload of the received frame (despite its name,
            this is the frame data handed to "framereceived" listeners)
        """
        if not isinstance(websocket, (bytes, bytearray)):
            # Text frames cannot carry the protobuf envelope; ignore them.
            return
        Message = kuaishou_pb2.SocketMessage()
        Message.ParseFromString(websocket)
        # Only payload type 310 is parsed as a feed push; ignore the rest.
        if Message.payloadType != 310:
            return
        feed_push = kuaishou_pb2.SCWebFeedPush()
        feed_push.ParseFromString(Message.payload)
        obj = MessageToDict(feed_push, preserving_proto_field_name=True)
        logging.debug(obj)

        # MessageToDict leaves out fields holding their default value, so every
        # lookup below goes through .get() instead of indexing.
        for feed in obj.get('commentFeeds') or []:
            username = feed.get('user', {}).get('userName', '')
            content = feed.get('content', '')
            if not content:
                continue
            logging.info(f"[📧直播间弹幕消息] [{username}]:{content}")
            data = {
                "username": username,
                "content": content
            }
            my_handle.process_data(data, "comment")

        for feed in obj.get('giftFeeds') or []:
            username = feed.get('user', {}).get('userName', '')
            giftId = feed.get('giftId')
            comboCount = feed.get('comboCount')
            logging.info(f"[🎁直播间礼物消息] 用户:{username} 赠送礼物Id={giftId} 连击数={comboCount}")

        for feed in obj.get('likeFeeds') or []:
            username = feed.get('user', {}).get('userName', '')
            logging.info(f"{username}")
class run(kslive):
    """Launcher that starts one ``kslive`` session thread per configured room id."""

    def __init__(self):
        """Split the configured, comma-separated room ids into ``self.ids_list``."""
        super().__init__()
        # The config value may be missing (None); treat that as "no rooms"
        # instead of failing on .split(). Blank entries are dropped.
        raw_ids = "" if self.live_ids is None else str(self.live_ids)
        self.ids_list = [part.strip() for part in raw_ids.split(",") if part.strip()]

    def run_live(self):
        """
        Program entry point: start a session thread for every room id and
        wait until all of them have finished.
        :return:
        """
        # Clamp the number of sessions allowed to run at the same time.
        if self.thread < 1:
            self.thread = 1
        elif self.thread > 8:
            self.thread = 8
            logging.info("线程最大允许8,线程数最好设置cpu核心数")

        if not self.live_ids or not self.ids_list:
            logging.info("请导入网页直播id,多个以','间隔")
            return

        semaphore = threading.Semaphore(self.thread)
        workers = []
        for n, room_id in enumerate(self.ids_list, start=1):
            # Each room gets its own kslive instance so browser state is not
            # shared between threads.
            worker = threading.Thread(
                target=kslive().main,
                args=(room_id, semaphore),
                name=f"线程:{n}-{room_id}",
            )
            worker.start()
            workers.append(worker)
        for worker in workers:
            worker.join()
def start_server():
    """Initialise the shared state, start the background tasks and run the rooms.

    Steps, in order:
      1. load ``config.json`` and set up logging and the message handler;
      2. start a thread that runs the enabled entries of the ``schedule`` config;
      3. start a thread that plays the ``trends_copywriting`` files in a loop;
      4. block in ``run().run_live()`` until every room session has ended.
    """
    global config, common, my_handle, last_username_list

    config_path = "config.json"
    config = Config(config_path)
    common = Common()

    # Log file path
    log_path = "./log/log-" + common.get_bj_time(1) + ".txt"
    Configure_logger(log_path)

    # Names of the most recently arrived users
    last_username_list = [""]

    my_handle = My_handle(config_path)
    if my_handle is None:
        logging.error("程序初始化失败!")
        os._exit(0)

    # Scheduled task
    def schedule_task(index):
        """Pick a random copy of schedule entry ``index`` and hand it to my_handle."""
        global config, common, my_handle, last_username_list

        logging.debug("定时任务执行中...")
        hour, minute = common.get_bj_time(6)

        # Spoken form of the current time; afternoon hours use the 12-hour clock.
        if 0 <= hour < 6:
            time_text = f"凌晨{hour}点{minute}分"
        elif 6 <= hour < 9:
            time_text = f"早晨{hour}点{minute}分"
        elif 9 <= hour < 12:
            time_text = f"上午{hour}点{minute}分"
        elif hour == 12:
            time_text = f"中午{hour}点{minute}分"
        elif 13 <= hour < 18:
            time_text = f"下午{hour - 12}点{minute}分"
        elif 18 <= hour < 20:
            time_text = f"傍晚{hour - 12}点{minute}分"
        elif 20 <= hour < 24:
            time_text = f"晚上{hour - 12}点{minute}分"
        else:
            # Unexpected hour value: fall back to a plain rendering rather
            # than leaving the variable unbound.
            time_text = f"{hour}点{minute}分"

        # Pick one of the copies configured for this schedule entry.
        random_copy = random.choice(config.get("schedule")[index]["copy"])

        # Dynamic variables that a copy may reference as {name}.
        variables = {
            'time': time_text,
            'last_username': last_username_list[-1],
        }

        # Substitute only the variables whose name occurs in the copy.
        used = {name: value for name, value in variables.items() if name in random_copy}
        content = random_copy.format(**used) if used else random_copy

        data = {
            "username": None,
            "content": content
        }

        logging.info(f"定时任务:{content}")

        my_handle.process_data(data, "schedule")

    # Start the scheduled tasks
    def run_schedule():
        """Register the enabled schedule entries, then run them forever."""
        try:
            for index, task in enumerate(config.get("schedule")):
                if task["enable"]:
                    # Run the task every ``task["time"]`` seconds.
                    schedule.every(task["time"]).seconds.do(partial(schedule_task, index))
        except Exception as e:
            logging.error(e)

        while True:
            try:
                schedule.run_pending()
            except Exception:
                # A failing job must not terminate the scheduler thread.
                logging.error(traceback.format_exc())
            # Jobs have a resolution of one second; sleeping between polls
            # keeps this loop from occupying a CPU core.
            time.sleep(1)

    # Create and start the scheduler thread
    schedule_thread = threading.Thread(target=run_schedule)
    schedule_thread.start()

    # Start the dynamic copywriting
    async def run_trends_copywriting():
        """Play the files of the configured copywriting folders in a loop."""
        global config

        try:
            if config.get("trends_copywriting", "enable") == False:  # noqa: E712
                return

            logging.info(f"动态文案任务线程运行中...")

            while True:
                # Pair each file with the entry it came from, so that the
                # prompt settings applied to a file are those of its own
                # folder and not those of whichever entry was read last.
                playlist = []
                for copywriting in config.get("trends_copywriting", "copywriting"):
                    for file_path in common.get_all_file_paths(copywriting["folder_path"]):
                        playlist.append((copywriting, file_path))

                # Random playback, when enabled
                if config.get("trends_copywriting", "random_play"):
                    random.shuffle(playlist)

                for copywriting, copywriting_file_path in playlist:
                    copywriting_file_content = common.read_file_return_content(copywriting_file_path)

                    if copywriting["prompt_change_enable"]:
                        # Let the LLM rewrite the copy, using the entry's prompt.
                        data_json = {
                            "user_name": "trends_copywriting",
                            "content": copywriting["prompt_change_content"] + copywriting_file_content
                        }
                        data_json["content"] = my_handle.llm_handle(config.get("chat_type"), data_json)
                    else:
                        data_json = {
                            "user_name": "trends_copywriting",
                            "content": copywriting_file_content
                        }

                    # Skip empty results; everything else is sent to the reread handler.
                    if data_json["content"] is not None and data_json["content"] != "":
                        my_handle.reread_handle(data_json)

                    await asyncio.sleep(config.get("trends_copywriting", "play_interval"))

                if not playlist:
                    # Nothing to play: wait before rescanning instead of spinning.
                    await asyncio.sleep(config.get("trends_copywriting", "play_interval"))
        except Exception:
            logging.error(traceback.format_exc())

    # Create and start the dynamic copywriting thread
    threading.Thread(target=lambda: asyncio.run(run_trends_copywriting())).start()

    run().run_live()
# Script entry point: only start the server when the file is executed directly.
if __name__ == "__main__":
    start_server()