LegSum / Summarizer /Extractive.py
d0r1h's picture
Create Extractive.py
d3c86fd
raw
history blame
534 Bytes
import nltk
from sumy.parsers.plaintext import PlaintextParser
from sumy.summarizers.luhn import LuhnSummarizer
from sumy.nlp.tokenizers import Tokenizer
# Fetch NLTK's 'punkt' resource when this module is imported.
# NOTE(review): presumably required by the sumy Tokenizer used in
# summarize() for sentence splitting — confirm before moving or removing.
nltk.download('punkt')
def summarize(file, SENTENCES_COUNT) -> str:
    """Return an extractive summary of a text file using the Luhn method.

    Args:
        file: Object exposing a ``name`` attribute that holds the path of
            the text file to summarize.
        SENTENCES_COUNT: Forwarded unchanged to the Luhn summarizer as the
            amount of sentences to select.

    Returns:
        The sentences chosen by the summarizer, joined with single spaces.

    Raises:
        OSError: If the file at ``file.name`` cannot be opened.
        UnicodeDecodeError: If the file content is not valid UTF-8.
    """
    # Decode explicitly as UTF-8: relying on open()'s default makes the
    # result depend on the host's locale settings.
    with open(file.name, encoding="utf-8") as handle:
        text = handle.read()

    document = PlaintextParser(text, Tokenizer("en")).document
    summarizer = LuhnSummarizer()
    return " ".join(
        str(sentence) for sentence in summarizer(document, SENTENCES_COUNT)
    )