Spaces:

JennySHT
/

summary

Running

summary / app.py

Update app.py

c5f9a82 verified 4 months ago

1.27 kB

	import streamlit as st
	from transformers import T5ForConditionalGeneration, T5Tokenizer
	import opencc

	# 使用中文摘要模型
	local_path = 'utrobinmv/t5_summary_en_ru_zh_base_2048'
	model = T5ForConditionalGeneration.from_pretrained(local_path)
	tokenizer = T5Tokenizer.from_pretrained(local_path)



	# Streamlit UI
	st.title("中文文章摘要工具")
	# Create an OpenCC converter for converting simplified Chinese to traditional Chinese
	converter = opencc.OpenCC('s2t')
	# Input text area for the article
	article = st.text_area("請輸入文章", "")

	# Function to generate summary
	@st.cache_data
	def generate_summary(article):
	inputs = tokenizer.encode("摘要：" + article, return_tensors="pt", max_length=1024, truncation=True)
	summary_ids = model.generate(inputs, max_length=180, min_length=60, length_penalty=2.0, num_beams=4, early_stopping=True)
	summary = tokenizer.decode(summary_ids[0], skip_special_tokens=True)
	return summary

	# Button to generate summary
	if st.button("生成摘要"):
	if article.strip() == "":
	st.error("請輸入文章。")
	else:
	summary = generate_summary(article)
	traditional_summary = converter.convert(summary)
	st.subheader("摘要:")
	st.write(traditional_summary)