|
@@ -0,0 +1,42 @@
|
|
1
|
import json
import os
import re
import sys
import urllib.parse
import urllib.request
from collections import Counter

from konlpy.tag import Kkma
|
|
7
|
+
|
|
8
|
def naver_blog_search(client_id, client_secret, text):
    """Query the Naver blog search Open API and return the raw JSON text.

    Args:
        client_id: Value sent in the ``X-Naver-Client-Id`` request header.
        client_secret: Value sent in the ``X-Naver-Client-Secret`` request
            header.
        text: Search phrase; it is percent-encoded before being appended to
            the query string.

    Returns:
        The response body decoded as UTF-8 when the status code is 200.
        For any other status code the code is printed and ``None`` is
        returned.

    Raises:
        urllib.error.URLError: Propagated unchanged from ``urlopen`` (this
            includes ``HTTPError`` for error statuses the opener rejects).
    """
    enc_text = urllib.parse.quote(text)
    url = "https://openapi.naver.com/v1/search/blog?query=" + enc_text  # JSON result
    # XML variant: "https://openapi.naver.com/v1/search/blog.xml?query=" + enc_text
    request = urllib.request.Request(url)
    request.add_header("X-Naver-Client-Id", client_id)
    request.add_header("X-Naver-Client-Secret", client_secret)
    # The context manager closes the connection on every exit path.
    with urllib.request.urlopen(request) as response:
        rescode = response.getcode()
        if rescode == 200:
            return response.read().decode('utf-8')
    # getcode() returns an int, so convert it before concatenating.
    print("Error Code:" + str(rescode))
    return None
|
|
22
|
+
|
|
23
|
# Non-greedy match of anything between '<' and the next '>'; compiled once
# because striphtml is called for every search result.
_TAG_PATTERN = re.compile(r'<.*?>')


def striphtml(data):
    """Return *data* with every ``<...>`` span removed.

    Args:
        data: Text that may contain markup tags.

    Returns:
        The input string with each shortest ``<`` ... ``>`` run deleted.
        Text outside such runs is left untouched; the pattern does not
        match across newlines.
    """
    return _TAG_PATTERN.sub('', data)
|
|
26
|
+
|
|
27
|
# Script body: search Naver blogs for a fixed keyword, pull selected noun tags
# out of each result description, and print the words that occur more than once.
result = []
kkma = Kkma()

# NOTE(review): the literal credentials below are committed to source control.
# They are kept only as a fallback so existing runs behave the same; prefer
# setting NAVER_CLIENT_ID / NAVER_CLIENT_SECRET and rotating these values.
naver_result = naver_blog_search(
    os.environ.get('NAVER_CLIENT_ID', 'OJgN42xxZiJXpnZtCH1j'),
    os.environ.get('NAVER_CLIENT_SECRET', 'crXggqJhhW'),
    '코딩',
)

# naver_blog_search returns None on a non-200 status; treat that as no items
# instead of letting json.loads(None) raise TypeError.
y = json.loads(naver_result) if naver_result is not None else {'items': []}

for b in y['items']:
    for word, pos in kkma.pos(striphtml(b['description'])):
        # Presumably the Kkma general-noun / proper-noun tags -- confirm
        # against the KoNLPy tag table.
        if pos in ('NNG', 'NNP'):
            result.append(word)

words = set(result)
loofWords = list(words)

# Count every word in a single pass rather than calling result.count()
# twice per distinct word.
frequency = Counter(result)
countList = [[w, frequency[w]] for w in loofWords if frequency[w] > 1]
print(countList)
|