-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrun.py
32 lines (25 loc) · 1.13 KB
/
run.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
'''
Created on Sep 20, 2016
@author: trideep
'''
import LanguageAnalysis.stackexchange as se
import LanguageAnalysis.filepath as fp
from LanguageAnalysis.data_processing.keyphrases import Keyphrase
from LanguageAnalysis.data_processing.language_sim import LanguageSimilarity
def main(fetch_questions=False, fetch_keyphrases=False, language_similarity=False):
    """Run the selected stages of the language-analysis workflow.

    Each flag switches on one independent stage. Enabled stages run in the
    order listed below; a stage whose flag is falsy is skipped entirely.

    Args:
        fetch_questions: When truthy, call ``se.fetch_questions`` for page 1
            of the hard-coded language tags, passing
            ``fp.question_file_integrated`` as the filename and ``'w'`` as
            the write mode.
        fetch_keyphrases: When truthy, build a ``Keyphrase`` object with
            ``integrate_data=True``, call ``create_keyphrases()``, request
            keyphrases with ``topn=30`` and hand the result to
            ``save_keyphrases`` together with ``fp.question_keyphrases``.
        language_similarity: When truthy, build a ``LanguageSimilarity``
            object and call ``create_lang_similarty_data()`` on it.

    Returns:
        None.
    """
    if fetch_questions:
        # The tag list is only needed by this stage, so it is built here.
        tags = ['javascript', 'java', 'mysql', 'python', 'c++',
                'c', 'sql', 'swift', 'matlab', 'html']
        se.fetch_questions(
            page=1,
            tags=tags,
            filename=fp.question_file_integrated,
            write_mode='w',
        )

    if fetch_keyphrases:
        keyphrase_gen = Keyphrase(integrate_data=True)
        keyphrase_gen.create_keyphrases()
        language_keyphrase_map = keyphrase_gen.get_keyphrases(topn=30)
        keyphrase_gen.save_keyphrases(language_keyphrase_map, fp.question_keyphrases)

    if language_similarity:
        lang_sim = LanguageSimilarity()
        # NOTE(review): a call to lang_sim.start_training() was disabled here
        # in the original; presumably training output already exists - confirm.
        lang_sim.create_lang_similarty_data()
if __name__ == '__main__':
    # A direct run enables only the language-similarity stage; the question
    # fetch and keyphrase stages are explicitly switched off.
    main(fetch_questions=False, fetch_keyphrases=False, language_similarity=True)