import re
# Replace every character outside the range 가-힣 with a single space,
# so that only Hangul syllables (separated by spaces) remain in `temp`.
temp = re.compile('[^가-힣]').sub(' ', temp)
- [^가-힣] : '가'부터 '힣'까지의 완성형 한글 음절이 아닌 문자 하나와 일치하는 정규 표현식. (영문, 숫자, 기호, 공백뿐 아니라 'ㄱ', 'ㅏ' 같은 낱자모도 여기에 해당한다.)
import konlpy
# Create the Hannanum tagger. The module imported above is `konlpy`; the
# previous spelling `konply` raised NameError before any text was processed.
hannanum = konlpy.tag.Hannanum()
# Extract the nouns from the cleaned text. The result is bound to `nouns`
# because the DataFrame construction further down reads that name; `temp`
# is rebound as well so any code that still uses `temp` sees the noun list.
nouns = hannanum.nouns(temp)
temp = nouns
import pandas as pd
# One row per extracted noun, plus a 'count' column holding the character
# length of each word (computed with the .str.len() accessor).
df_word = pd.DataFrame({'word': nouns}).assign(
    count=lambda frame: frame['word'].str.len()
)
# Count how often each word occurs and order the words from most to least
# frequent. The chain is wrapped in parentheses because a line that starts
# with `.agg(...)` is not a valid continuation of the previous statement.
df_word = (
    df_word.groupby('word', as_index=False)
    # 'count' here names the aggregation function (rows per word), not a
    # column called 'count'; the result is stored in the new column 'n'.
    .agg(n=('word', 'count'))
    .sort_values('n', ascending=False)
)
# Global matplotlib defaults, set one key at a time in the original order.
# NOTE(review): 'Malgun Gothic' is presumably chosen so Hangul labels render;
# the font has to be installed on the machine — confirm.
plt.rcParams['font.family'] = 'Malgun Gothic'
plt.rcParams['figure.dpi'] = 120
plt.rcParams['figure.figsize'] = [6.5, 6]
# Bar chart with the words on the y-axis and their counts 'n' on the x-axis.
# NOTE(review): `top20` is not defined in this snippet — presumably the first
# 20 rows of the sorted df_word; confirm where it is created.
sns.barplot(x='n', y='word', data=top20)