kristiyanto · July 3, 2024 14:41
diff --git a/t5.py b/t5.py
 # Refer to the Jupyter Notebook and article for package imports and the complete code.

 model_name = "t5-small"
 tokenizer = T5Tokenizer.from_pretrained(model_name, legacy=False)
 model = T5ForConditionalGeneration.from_pretrained(model_name)

 def summarize_with_t5(text, max_length=80):
     
    if len(text) < max_length:
        return text

    input_text = "summarize: " + text

    input_ids = tokenizer.encode(input_text, return_tensors="pt", truncation=True)   
    summary_ids = model.generate(input_ids, max_length=max_length, min_length=10, length_penalty=0.5, num_beams=4, early_stopping=True)
    summary = tokenizer.decode(summary_ids[0], skip_special_tokens=True)

    return summary

 data['t5_summary'] = data.description.apply(summarize_with_t5)
	# Refer to the Jupyter Notebook and article for package imports and the complete code.

	model_name = "t5-small"
	tokenizer = T5Tokenizer.from_pretrained(model_name, legacy=False)
	model = T5ForConditionalGeneration.from_pretrained(model_name)

	def summarize_with_t5(text, max_length=80):

	if len(text) < max_length:
	return text

	input_text = "summarize: " + text

	input_ids = tokenizer.encode(input_text, return_tensors="pt", truncation=True)
	summary_ids = model.generate(input_ids, max_length=max_length, min_length=10, length_penalty=0.5, num_beams=4, early_stopping=True)
	summary = tokenizer.decode(summary_ids[0], skip_special_tokens=True)

	return summary

	data['t5_summary'] = data.description.apply(summarize_with_t5)
No results found