-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathrun.sh
21 lines (16 loc) · 784 Bytes
/
run.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
#!/bin/bash
inputfile=$1
topicNumber=$2
iterationNumber=$3
numTopPhrases=$4
echo ${green}===filter out high frequent phrases, which are not considered in the model===${reset}
python script/highFreuquentPhrase.py ${inputfile} input/stopPhrases.txt
echo ${green}===build the link information between phrases and words===${reset}
python script/linkInformation.py ${inputfile} input/phrase_score.txt
cd script
#echo ${green}===serialize the input file, to speed up the io of topic modeling===${reset}
#bash runSerializeData.sh ${inputfile}
#echo ${green}===build the invert index for phrases===${reset}
#python buildInvertIndex.py ${inputfile}
echo ${green}===topic modeling on phrases===${reset}
bash runSparseTP.sh ${inputfile} ${topicNumber} ${iterationNumber} ${numTopPhrases}