-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathcmd.txt
28 lines (11 loc) · 1.68 KB
/
cmd.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
# Command reference for the NearDuplicateDetection jobs.
# Every line is a standalone invocation against target/NearDuplicateDetection-1.1-SNAPSHOT.jar
# (except the mvn line, which runs a main class through Maven).
# The `hadoop jar` commands take single-dash options (-input/-output/-reducers);
# the `spark-submit` commands take double-dash options (--input/--output/--reducers).
# NOTE(review): the list does not look like a script meant to be run top to bottom
# (e.g. output_vector.txt is consumed before the generator line appears) — confirm intended order.

# MinHash on the bundled sample: `hadoop jar` variant, then `spark-submit` variant (class MinHashS).
hadoop jar target/NearDuplicateDetection-1.1-SNAPSHOT.jar org.NearDuplicateDetection.MinHash -input resources/sample.txt -output output-java-mh
spark-submit --class org.NearDuplicateDetection.MinHashS target/NearDuplicateDetection-1.1-SNAPSHOT.jar --input resources/sample.txt --output output-scala-mh

# RandomProjection reading output_vector.txt: `hadoop jar` variant.
hadoop jar target/NearDuplicateDetection-1.1-SNAPSHOT.jar org.NearDuplicateDetection.RandomProjection -input output_vector.txt -output output-java-rj
# Runs the GenerteRandomVectors main class via the Maven exec plugin.
# NOTE(review): "Generte" may be a misspelling of "Generate" — verify against the actual class name before changing.
# NOTE(review): presumably this is what produces output_vector.txt used by the RandomProjection commands — confirm.
mvn exec:java -Dexec.mainClass=org.NearDuplicateDetection.GenerteRandomVectors
# RandomProjection reading output_vector.txt: `spark-submit` variant (class RandomProjectionS).
spark-submit --class org.NearDuplicateDetection.RandomProjectionS target/NearDuplicateDetection-1.1-SNAPSHOT.jar --input output_vector.txt --output output-scala-rj

# MinHash on wiki inputs. The first command uses an absolute path under /Users/lucasmeng,
# so it only works where that path exists; the second passes -reducers 16.
hadoop jar target/NearDuplicateDetection-1.1-SNAPSHOT.jar org.NearDuplicateDetection.MinHash -input /Users/lucasmeng/WikiClean/wiki_output.txt -output output-wiki-java-mh
hadoop jar target/NearDuplicateDetection-1.1-SNAPSHOT.jar org.NearDuplicateDetection.MinHash -input cs651-pro/cs651-pro-wiki-new.txt -output cs651-pro-wiki -reducers 16

# Cluster step over earlier job outputs.
# NOTE(review): no command in this list writes output-java-mh-3 — confirm where that input comes from.
# NOTE(review): the first and third Cluster commands both write to output-cluster; if the job does not
# clear an existing output directory, the later run may fail or overwrite — confirm.
hadoop jar target/NearDuplicateDetection-1.1-SNAPSHOT.jar org.NearDuplicateDetection.Cluster -input output-java-mh-3 -output output-cluster
hadoop jar target/NearDuplicateDetection-1.1-SNAPSHOT.jar org.NearDuplicateDetection.Cluster -input output-java-rj -output output-cluster-rj
hadoop jar target/NearDuplicateDetection-1.1-SNAPSHOT.jar org.NearDuplicateDetection.Cluster -input cs651-pro-wiki -output output-cluster

# MinHashS on the wiki input with explicit Spark resources:
# 2 executors, 4 cores per executor, 24G executor memory, and --reducers 16 passed to the application.
spark-submit --class org.NearDuplicateDetection.MinHashS --num-executors 2 --executor-cores 4 --executor-memory 24G target/NearDuplicateDetection-1.1-SNAPSHOT.jar --input cs651-pro/cs651-pro-wiki-new.txt --output cs651-pro-wiki-scala --reducers 16