# Author : tmlab / Date : 2016. 10. 7. 14:55 / Category : Text Mining/Python
from konlpy.tag import Kkma
# Create the Kkma tagger and run it once on a sample sentence as a quick check.
# The result is discarded here; pos() yields (morpheme, tag) items, as the
# tagging loop later in this file indexes them with [0] and [1].
kkma = Kkma()
kkma.pos("아버지가 방에 들어가신다")
import xlrd
# Open the input workbook and take its first sheet.
workbook = xlrd.open_workbook("./hd.xlsx")
worksheet = workbook.sheet_by_index(0)
nrows = worksheet.nrows

# Collect the cell values of every row, in sheet order, as one list per row.
row_val1 = [worksheet.row_values(row_index) for row_index in range(nrows)]
from konlpy.tag import Kkma
# Rebinds the module-level tagger used by the POS-tagging loop below.
# NOTE(review): an identical instance is already created near the top of the
# file, so this second construction looks redundant — confirm before removing.
kkma = Kkma()
def hidden_char(word):
    """Mask a string so that only its first character stays readable.

    Args:
        word: The text to mask.

    Returns:
        An empty string when ``word`` is empty; otherwise the first character
        of ``word`` followed by one ``*`` for each remaining character.
    """
    if word == "":
        return ""
    # One asterisk per character after the first keeps the original length.
    return word[0] + "*" * (len(word) - 1)
# Mask column 1 (unpacked as "author" by the writer at the end of the file)
# of every row in place, printing the row index as progress output.
# NOTE(review): row 0 is treated as a header by the tagging loop further down,
# yet its column 1 is masked here as well — confirm that is intended.
for i, record in enumerate(row_val1):
    record[1] = hidden_char(record[1])
    print(i)

# Notebook-style inspection expressions; they have no effect when run as a script.
row_val1[2]
len(row_val1)
# Append a POS-tagged rendering of column 3 (the article text) to every row.
# Row 0 is the header row and receives the new column's title instead.
for i, record in enumerate(row_val1):
    print(i)  # progress output

    if i == 0:  # value comparison; `is 0` tests object identity
        record.append("article_POS")
        continue

    article = record[3]

    # Rows with nothing to analyse still need the extra column, so the
    # placeholder goes onto the row itself, never onto the outer list.
    is_blank = isinstance(article, str) and not article.strip()
    # 42 presumably is xlrd's error code for a #N/A cell (0x2A) — TODO confirm
    # against the input workbook.
    if is_blank or article == 42:
        record.append("")
        continue

    tagged = kkma.pos(article)
    # Render the analysis result as "word/POS;" for each morpheme.
    record.append("".join(item[0] + "/" + item[1] + ";" for item in tagged))

# Notebook-style inspection expression; it has no effect when run as a script.
row_val1[3]
import xlsxwriter
# Write every row of row_val1 to the first worksheet of ./after_POS.xlsx,
# one spreadsheet row per record and one cell per field.
# The workbook is used as a context manager so that close() is still called
# if a write raises part-way through.
with xlsxwriter.Workbook("./after_POS.xlsx") as work_book:
    work_sheet = work_book.add_worksheet()
    row = 0
    col = 0
    # Each record must hold exactly these five fields, in this order.
    for rownum, author, date, article, art_POS in row_val1:
        fields = (rownum, author, date, article, art_POS)
        for offset, value in enumerate(fields):
            work_sheet.write(row, col + offset, value)
        row += 1