kristiyanto · July 3, 2024 14:34
diff --git a/sent_score.py b/sent_score.py
 # Refer to the Jupyter Notebook and article for package imports and the complete code.

 def summarize(text, char_limit=80):
     """Build a short extractive summary from the row's best-matching sentences.

     The description is split into sentences, each sentence is scored by how
     many times the row's keywords occur in it (case-insensitive substring
     count), and the highest-scoring sentences are joined until adding the
     next one would exceed ``char_limit``.

     Args:
         text: Object exposing ``description`` and ``keywords`` attributes.
             The snippet passes it via ``data.apply(..., axis=1)``, so it is
             presumably a pandas row -- confirm against the caller.
         char_limit: Character budget for every sentence after the first.
             The top-ranked sentence is always returned, even when it alone
             is longer than this limit.

     Returns:
         The selected sentences separated by single spaces, or ``""`` when
         there are no keywords or no sentences.
     """
     # ``nlp`` is defined outside this snippet; it is assumed to be a
     # spaCy-style pipeline whose result exposes ``.sents`` -- TODO confirm.
     doc = nlp(text.description)
     sentences = [sent.text.strip() for sent in doc.sents]
     keywords = text.keywords

     if not keywords or not sentences:
         return ""

     # Lower-case each keyword once instead of once per sentence.
     lowered_keywords = [keyword.lower() for keyword in keywords]

     def keyword_hits(sentence):
         """Count case-insensitive keyword occurrences in one sentence."""
         lowered = sentence.lower()
         return sum(lowered.count(keyword) for keyword in lowered_keywords)

     # Sort on the score alone. Sorting (score, sentence) tuples made ties
     # fall back to comparing sentence text, so equally scored sentences came
     # out in reverse-alphabetical order. sorted() is stable even with
     # reverse=True, so ties now keep their original document order.
     ranked = sorted(sentences, key=keyword_hits, reverse=True)

     # The best sentence is kept unconditionally so the summary is never
     # empty just because the top sentence is long.
     picked = [ranked[0]]
     used = len(ranked[0]) + 1  # +1 for the separating space
     for sentence in ranked[1:]:
         needed = len(sentence) + 1
         if used + needed > char_limit:
             # Stop at the first sentence that does not fit.
             break
         picked.append(sentence)
         used += needed

     return " ".join(picked).strip()


 # Call summarize once per row (axis=1) and store the results in the
 # 'summary' column. `data` is defined outside this snippet; presumably a
 # pandas DataFrame with `description` and `keywords` columns -- confirm.
 data['summary'] = data.apply(summarize, axis=1)
	# Refer to the Jupyter Notebook and article for package imports and the complete code.

	def summarize(text, char_limit=80):
		"""Return the highest keyword-scoring sentences of a row's description.

		Each sentence of ``text.description`` is scored by the number of
		case-insensitive occurrences of the entries in ``text.keywords``.
		Sentences are then taken from highest to lowest score until the next
		one would push the summary past ``char_limit``.

		Args:
			text: Object with ``description`` and ``keywords`` attributes
				(presumably a pandas row supplied by ``data.apply`` --
				confirm against the caller).
			char_limit: Character budget applied to every sentence after the
				first; the top-ranked sentence is always included.

		Returns:
			The chosen sentences joined by single spaces, or ``""`` when
			there are no keywords or no sentences.
		"""
		# ``nlp`` comes from outside this snippet; assumed to be a spaCy-style
		# pipeline whose result exposes ``.sents`` -- TODO confirm.
		doc = nlp(text.description)
		sentences = [sent.text.strip() for sent in doc.sents]
		keywords = text.keywords

		if not keywords or not sentences:
			return ""

		# Normalise the keywords once; they do not change between sentences.
		needles = [keyword.lower() for keyword in keywords]

		scores = []
		for sentence in sentences:
			haystack = sentence.lower()
			scores.append(sum(haystack.count(needle) for needle in needles))

		# Rank sentence positions by score only. The sort is stable, so
		# sentences with equal scores stay in document order rather than being
		# ordered by their text.
		order = sorted(range(len(sentences)), key=scores.__getitem__, reverse=True)

		chosen = []
		length = 0
		for rank, position in enumerate(order):
			sentence = sentences[position]
			cost = len(sentence) + 1  # sentence plus its separating space
			# Rank 0 is always kept; later sentences must fit the budget.
			if rank > 0 and length + cost > char_limit:
				break
			chosen.append(sentence)
			length += cost

		return " ".join(chosen).strip()


	# Call summarize once per row (axis=1) and store the results in the
	# 'summary' column. `data` is defined outside this snippet; presumably a
	# pandas DataFrame with `description` and `keywords` columns -- confirm.
	data['summary'] = data.apply(summarize, axis=1)
No results found