# 명사 빈도수 계산 함수
# 중복단어 일렬로 세우기
def noun_counter(doc, num=10):
    """Return the most frequent items of ``doc`` together with their counts.

    Args:
        doc: Iterable of hashable items to count (for example a list of
            noun strings).
        num: Maximum number of entries to return. Defaults to 10.

    Returns:
        A list of ``(item, count)`` tuples ordered from most to least
        frequent. The list is shorter than ``num`` when ``doc`` contains
        fewer than ``num`` distinct items.
    """
    # Kept as a function-local import, as in the original, so the function
    # does not rely on a module-level import being present.
    from collections import Counter

    return Counter(doc).most_common(num)
def get_word_list(noun, n):
    """Return up to ``n`` of the most frequent words in ``noun``.

    Args:
        noun: Iterable of words; passed unchanged to ``noun_counter``.
        n: Maximum number of words to return.

    Returns:
        A list of distinct words ordered from most to least frequent. It
        holds fewer than ``n`` words when ``noun`` has fewer than ``n``
        distinct words.
    """
    # Walk the pairs noun_counter actually returned instead of indexing with
    # range(n): the index loop raised IndexError whenever the input had
    # fewer than n distinct words.
    return [word for word, _count in noun_counter(noun, n)]
# 중복단어를 제거하면서 위에서부터 단어 키워드 추출
def get_word_list(noun, n):
    """Return up to ``n`` of the most frequent words in ``noun``.

    Duplicates are collapsed by the frequency count in ``noun_counter``, so
    each word appears at most once in the result.

    Args:
        noun: Iterable of words; passed unchanged to ``noun_counter``.
        n: Maximum number of words to return.

    Returns:
        A list of distinct words ordered from most to least frequent. It
        holds fewer than ``n`` words when ``noun`` has fewer than ``n``
        distinct words.
    """
    # NOTE(review): a function with this same name and signature is defined
    # earlier in the file; this later definition is the one in effect.
    # Consider removing one of the two.
    #
    # Walk the pairs noun_counter actually returned instead of indexing with
    # range(n): the index loop raised IndexError whenever the input had
    # fewer than n distinct words.
    return [word for word, _count in noun_counter(noun, n)]
# 결과 실행
# 상위 20개 추출
# Extract the 20 most frequent words for each of the six word lists.
# Every call previously passed word1, so all six results were identical;
# each result now reads from its matching input.
# NOTE(review): assumes word2..word6 are defined earlier in the file in the
# same way as word1 -- confirm before running.
word1_list_fre = get_word_list(word1, 20)
word2_list_fre = get_word_list(word2, 20)
word3_list_fre = get_word_list(word3, 20)
word4_list_fre = get_word_list(word4, 20)
word5_list_fre = get_word_list(word5, 20)
word6_list_fre = get_word_list(word6, 20)