텍스트마이닝2

Daum·2021년 4월 2일
0

Big Data

목록 보기
5/7
post-thumbnail
import pytagcloud
import random
import webbrowser
from konlpy.tag import Okt
from collections import Counter
def get_tags(text, ntags=20, multiplier=2):
    """Build tag-cloud entries for the most frequent nouns in *text*.

    Args:
        text: Iterable of strings; each item is passed to ``Okt().nouns``
            to extract its nouns.
        ntags: Maximum number of distinct nouns to return.
        multiplier: Scale factor applied to each noun's frequency when
            computing the tag size.

    Returns:
        A list of dicts with the keys ``'color'`` (the value returned by
        ``color()``), ``'tag'`` (the noun) and ``'size'``
        (``2 * frequency * multiplier``), ordered from most to least
        frequent. Empty when no nouns were found.
    """
    t = Okt()
    nouns = []
    for sentence in text:
        nouns.extend(t.nouns(sentence))

    # Count once, after all nouns are collected. Counting inside the loop
    # was quadratic and left `count` undefined for empty input.
    count = Counter(nouns)
    return [
        {'color': color(), 'tag': n, 'size': 2 * c * multiplier}
        for n, c in count.most_common(ntags)
    ]
 
def r():
    """Return a random integer between 0 and 255 inclusive."""
    return random.randint(0, 255)


def color():
    """Return a tuple of three independent ``r()`` values."""
    return (r(), r(), r())

def draw_cloud(tags, filename, fontname='Nobile', size1=(1300, 800)):
    """Render *tags* to an image file and open it with ``webbrowser``.

    Args:
        tags: Tag entries passed straight to
            ``pytagcloud.create_tag_image``.
        filename: Path of the image file to create and then open.
        fontname: Font name forwarded to pytagcloud.
        size1: Size forwarded to pytagcloud as its ``size`` argument.
    """
    # Use the caller-supplied path; the hard-coded 'wordcloud.png' used
    # previously made the `filename` argument a no-op.
    pytagcloud.create_tag_image(tags, filename, fontname=fontname, size=size1)
    webbrowser.open(filename)

# Load the corpus as a list of lines (trailing newlines are kept, exactly
# as readlines() returns them). The context manager closes the file even
# if reading fails.
with open('musinsa.txt', 'r', encoding='utf-8') as file:
    musinsa = file.readlines()

# Compute the tag entries, print them, then render and open the cloud.
tags = get_tags(musinsa)
print(tags)

draw_cloud(tags, 'wordcloud.png')

0개의 댓글