package com.test.lucene; import java.io.File; import java.io.IOException; import java.io.StringReader; import java.util.Calendar; import org.apache.lucene.analysis.Analyzer; import org.apache.lucene.analysis.standard.StandardAnalyzer; import org.apache.lucene.document.Document; import org.apache.lucene.index.DirectoryReader; import org.apache.lucene.index.IndexReader; import org.apache.lucene.queries.mlt.MoreLikeThis; import org.apache.lucene.queryparser.classic.ParseException; import org.apache.lucene.queryparser.classic.QueryParser; import org.apache.lucene.search.IndexSearcher; import org.apache.lucene.search.Query; import org.apache.lucene.search.ScoreDoc; import org.apache.lucene.search.TopDocs; import org.apache.lucene.store.Directory; import org.apache.lucene.store.FSDirectory; import org.apache.lucene.store.IOContext; import org.apache.lucene.store.RAMDirectory; import org.apache.lucene.util.Version; import de.jetwick.snacktory.HtmlFetcher; import de.jetwick.snacktory.JResult; /** * Testing processing time of FSDirectory and RAMDirectory * using simple and MLT queries * */ public class App { // private static String[] pages = { // "http://insidetv.ew.com/2012/10/15/walking-dead-season-3-premiere-ratings/", // "http://techcrunch.com/2012/10/16/facebook-rd-goes-global-opens-engineering-office-in-london-its-first-outside-the-u-s/", // "http://www.bostondynamics.com/index.html", // "http://www.readwriteweb.com/biz/2012/10/how-hard-is-it-to-get-and-use-a-3d-printer.php", // "http://prettymuchamazing.com/news/album-stream-bat-for-lashes-the-haunted-man"}; // private static String[] pages = { "http://www.lemonde.fr/sciences/article/2012/10/11/serge-haroche-il-y-a-une-contradiction-entre-le-temps-des-politiques-et-le-temps-de-la-recherche_1773818_1650684.html", "http://www.business-angel-france.com/business-angel-france-coup-de-gueule-faut-pas-prendre-les-business-angels-pour-des-mougeons", "http://www.larecherche.fr/content/actualite-sante/article?id=32457", "http://www.lesechos.fr/entreprises-secteurs/tech-medias/actu/0202329311759-open-data-l-etat-cherche-a-monetiser-les-donnees-publiques-500953.php", "http://www.usinenouvelle.com/article/les-pme-poumons-essentiels-de-l-economie-europeenne.N183637"}; private static String[] terms = { "Zombie", "Vampire", "Nigth", "Wolf", "Human"}; private static int factor = 1; private static String[] content = new String[pages.length]; public static void main( String[] args ) { System.out.println("Getting " + pages.length + " pages' content... "); for(int i =0; i