Spaces:

deeme
/

long

Paused

App Files Files Community

long / summary.py

deeme

Upload 111 files

217acfe verified 11 months ago

raw

history blame contribute delete

5.49 kB

	import time
	from core.parser_utils import parse_chapters
	from core.summary_novel import summary_draft, summary_plot, summary_chapters
	from config import MAX_NOVEL_SUMMARY_LENGTH, MAX_THREAD_NUM, ENABLE_ONLINE_DEMO

	def batch_yield(generators, max_co_num=5, ret=None):
	    """Advance several generators round by round and collect their return values.

	    In every round the generators are visited in order; finished ones are
	    skipped and at most ``max_co_num`` of the remaining ones are advanced by a
	    single ``next()`` call. After each round that leaves at least one
	    generator unfinished, the list of most recently yielded values is yielded.

	    Args:
	        generators: Sized, iterable collection of generator objects.
	        max_co_num: Maximum number of unfinished generators advanced per round.
	        ret: Optional list that receives the return values. It is cleared and
	            refilled in place once every generator has finished. A fresh list
	            is created when omitted, so separate calls never share results.

	    Yields:
	        The same list object on every round, mutated in place; slot ``i`` holds
	        the latest value yielded by ``generators[i]``, or ``None`` if it has
	        not yielded yet. Copy it if a snapshot must be kept.

	    Returns:
	        ``ret``, holding each generator's ``StopIteration.value`` in input order.
	    """
	    # A mutable default would be shared (and overwritten) across calls.
	    if ret is None:
	        ret = []

	    total = len(generators)
	    results = [None] * total
	    yields = [None] * total
	    finished = [False] * total

	    while True:
	        co_num = 0
	        for i, gen in enumerate(generators):
	            if finished[i]:
	                continue

	            # A generator that finishes in this round still uses up a slot.
	            co_num += 1
	            try:
	                yields[i] = next(gen)
	            except StopIteration as e:
	                results[i] = e.value
	                finished[i] = True

	            if co_num >= max_co_num:
	                break

	        if all(finished):
	            break

	        yield yields

	    ret.clear()
	    ret.extend(results)
	    return ret

	def process_novel(content, novel_name, model, sub_model, max_novel_summary_length, max_thread_num):
	    """Summarize a novel in three stages, yielding progress dicts along the way.

	    Stages: per-chapter draft summaries (``summary_draft``), per-chapter plot
	    summaries (``summary_plot``) and one whole-book outline
	    (``summary_chapters``). Each stage is driven through ``batch_yield`` with
	    ``max_co_num=max_thread_num``.

	    Args:
	        content: Full novel text; truncated to ``max_novel_summary_length``
	            characters when longer.
	        novel_name: Passed through to ``summary_chapters``.
	        model: Passed through to the ``summary_*`` helpers.
	        sub_model: Passed through to the ``summary_*`` helpers.
	        max_novel_summary_length: Maximum number of characters processed.
	        max_thread_num: Maximum number of generators advanced per round.

	    Yields:
	        Dicts with a ``"progress_msg"`` key. The last dict additionally carries
	        ``"outline"``, ``"plot"`` and ``"draft"``.

	    Raises:
	        Exception: When ``ENABLE_ONLINE_DEMO`` is set and a limit exceeds
	            ``MAX_NOVEL_SUMMARY_LENGTH`` / ``MAX_THREAD_NUM``, or when no
	            chapter could be parsed.
	    """
	    if ENABLE_ONLINE_DEMO:
	        if max_novel_summary_length > MAX_NOVEL_SUMMARY_LENGTH:
	            raise Exception("在线Demo模型下，最大小说长度不能超过" + str(MAX_NOVEL_SUMMARY_LENGTH) + "个字符！")
	        if max_thread_num > MAX_THREAD_NUM:
	            raise Exception("在线Demo模型下，最大线程数不能超过" + str(MAX_THREAD_NUM) + "！")

	    if len(content) > max_novel_summary_length:
	        content = content[:max_novel_summary_length]
	        yield {"progress_msg": f"小说长度超出最大处理长度，已截断，只处理前{max_novel_summary_length}个字符。"}
	        time.sleep(1)

	    # Parse chapters
	    yield {"progress_msg": "正在解析章节..."}

	    chapter_titles, chapter_contents = parse_chapters(content)

	    yield {"progress_msg": "解析出章节数：" + str(len(chapter_titles))}

	    if len(chapter_titles) == 0:
	        raise Exception("解析出章节数为0！！！")

	    # Process draft summaries
	    yield {"progress_msg": "正在生成剧情摘要..."}
	    dw_list = []
	    gens = [
	        summary_draft(model, sub_model, ' '.join(title), chapter_content)
	        for title, chapter_content in zip(chapter_titles, chapter_contents)
	    ]
	    for yields in batch_yield(gens, ret=dw_list, max_co_num=max_thread_num):
	        started, chars_num, current_cost, currency_symbol, model_text = _progress_stats(yields)
	        yield {"progress_msg": f"正在生成剧情摘要进度：{started} / {len(yields)} 模型：{model_text} 已生成字符：{chars_num} 已花费：{current_cost:.4f}{currency_symbol}"}

	    # Process plot summaries
	    yield {"progress_msg": "正在生成章节大纲..."}
	    cw_list = []
	    gens = [
	        summary_plot(model, sub_model, ' '.join(title), dw.x)
	        for title, dw in zip(chapter_titles, dw_list)
	    ]
	    for yields in batch_yield(gens, ret=cw_list, max_co_num=max_thread_num):
	        started, chars_num, current_cost, currency_symbol, model_text = _progress_stats(yields)
	        yield {"progress_msg": f"正在生成章节大纲进度：{started} / {len(yields)} 模型：{model_text} 已生成字符：{chars_num} 已花费：{current_cost:.4f}{currency_symbol}"}

	    # Process chapter summaries
	    yield {"progress_msg": "正在生成全书大纲..."}
	    ow_list = []
	    gens = [summary_chapters(model, sub_model, novel_name, chapter_titles, [cw.global_context['chapter'] for cw in cw_list])]
	    for yields in batch_yield(gens, ret=ow_list, max_co_num=max_thread_num):
	        _, chars_num, current_cost, currency_symbol, model_text = _progress_stats(yields)
	        yield {"progress_msg": f"正在生成全书大纲模型：{model_text} 已生成字符：{chars_num} 已花费：{current_cost:.4f}{currency_symbol}"}

	    # Prepare final response
	    outline = ow_list[0]
	    plot_data = {}
	    draft_data = {}

	    chapter_outlines = [e[1] for e in outline.xy_pairs]
	    for title, chapter_outline, cw, dw in zip(chapter_titles, chapter_outlines, cw_list, dw_list):
	        chapter_name = ' '.join(title)
	        plot_data[chapter_name] = {
	            'chunks': [('', e) for e, _ in dw.xy_pairs],
	            # cw.global_context['chapter'] is not used here because it lacks the chapter name
	            'context': chapter_outline,
	        }
	        draft_data[chapter_name] = {
	            'chunks': dw.xy_pairs,
	            'context': '',  # Draft doesn't have global context
	        }

	    final_response = {
	        "progress_msg": "处理完成！",
	        "outline": {
	            "chunks": outline.xy_pairs,
	            "context": outline.global_context['outline'],
	        },
	        "plot": plot_data,
	        "draft": draft_data,
	    }

	    yield final_response


	def _progress_stats(yields):
	    """Aggregate one progress snapshot into the values shown in progress messages.

	    Args:
	        yields: List of per-generator progress dicts; ``None`` marks a generator
	            that has not yielded yet.

	    Returns:
	        Tuple ``(started, chars_num, current_cost, currency_symbol, model_text)``
	        where ``started`` counts the non-``None`` entries, the two sums run over
	        those entries, and the last two values come from the first such entry.
	    """
	    active = [e for e in yields if e is not None]
	    chars_num = sum(e['chars_num'] for e in active)
	    current_cost = sum(e['current_cost'] for e in active)
	    # Defaults keep an all-None snapshot from raising StopIteration, which a
	    # generator caller would see as RuntimeError (PEP 479).
	    currency_symbol = next((e['currency_symbol'] for e in active), '')
	    model_text = next((e['model'] for e in active), '')
	    return len(active), chars_num, current_cost, currency_symbol, model_text