Add files via upload

박은주
Commit a68f287e6c445d99595dab655427c8fbaa0e58f6 a68f287e 1 parent 30515d6a
Showing 1 changed file with 25 additions and 0 deletions
GetTopic.py
--- a/GetTopic.py 0 → 100644
View file @a68f287
+++ b/GetTopic.py 0 → 100644
View file @a68f287
+import os
+import csv
+
+from sklearn.metrics.pairwise import cosine_similarity
+from sklearn.feature_extraction.text import TfidfVectorizer
+from sklearn.cluster import KMeans
+from konlpy.tag import Okt
+
+# Single Okt tagger instance, created once at import time and reused by DocToNouns.
+okt = Okt()
+def DocToNouns(docs):
+    """Run ``okt.nouns`` over every document and collect the results.
+
+    Args:
+        docs: Iterable of documents; each item is passed unchanged to
+            ``okt.nouns``.
+
+    Returns:
+        A list with one dict per document, in input order. Each dict has
+        ``'id'`` (the zero-based position of the document in ``docs``) and
+        ``'nouns'`` (the items returned by ``okt.nouns`` joined with single
+        spaces).
+    """
+    records = []
+    for index, text in enumerate(docs):
+        extracted = okt.nouns(text)
+        records.append({'id': index, 'nouns': ' '.join(extracted)})
+    return records
+
+# Directory containing this script; data.csv is resolved relative to it
+# rather than to the current working directory.
+BASE_DIR = os.path.dirname(os.path.abspath(__file__))
+
+# newline='' is what the csv module documents for files handed to csv.reader;
+# 'utf-8-sig' drops a leading byte-order mark if the file has one.
+with open(os.path.join(BASE_DIR, 'data.csv'), 'r', encoding='utf-8-sig', newline='') as db:
+    # csv.reader yields each row as a list of field strings, but the tagger
+    # used by DocToNouns works on a single string, so the fields of a row are
+    # folded into one text per post.
+    # NOTE(review): assumes every column of a row is part of the post text —
+    # confirm against the actual layout of data.csv.
+    posts = [' '.join(row) for row in csv.reader(db)]
+
+# One {'id', 'nouns'} record per CSV row, in file order.
+nouns = DocToNouns(posts)
+print(nouns)
\ No newline at end of file