// Logs the text returned by getHelp() and exits with status 1; then builds an LSSimilarity from lsm, size and stemmer, calls interactive() on it, and compares the strings "word" and "term", keeping the result as a float.
// NOTE(review): System.exit(1) comes before the remaining statements, so these were presumably separate code paths in the original file — confirm.
logger.info(getHelp()); System.exit(1); LSSimilarity lss = new LSSimilarity(lsm, size, stemmer); lss.interactive(); float cos = lss.compare("word", "term");
// compare2(vi, vj) returns an array; only element 0 is read here (presumably the dot product, going by the variable name — TODO confirm).
double dot = lss.compare2(vi, vj)[0];
public static void main(String[] args) throws Exception { String logConfig = System.getProperty("log-config"); if (logConfig == null) { logConfig = "log-config.txt"; } PropertyConfigurator.configure(logConfig); if (args.length != 6) { System.out.println( "Usage: java -mx512M eu.fbk.utils.lsa.util.NgramComparator input threshold size dim idf file"); System.exit(1); } File Ut = new File(args[0] + "-Ut"); File Sk = new File(args[0] + "-S"); File r = new File(args[0] + "-row"); File c = new File(args[0] + "-col"); File df = new File(args[0] + "-df"); double threshold = Double.parseDouble(args[1]); int size = Integer.parseInt(args[2]); int dim = Integer.parseInt(args[3]); boolean rescaleIdf = Boolean.parseBoolean(args[4]); LSM lsm = new LSM(Ut, Sk, r, c, df, dim, rescaleIdf); LSSimilarity lss = new LSSimilarity(lsm, size); new NgramComparator(args[5], lss); } // end main } // end NgramComparator
private float[] compareAll(BOW bow, String[] s, LSSimilarity lss) throws IOException, MalformedURLException { URL[] concept = getConceptURL(s); BOW[] bows = new BOW[concept.length]; float[] f = new float[concept.length]; for (int i = 0; i < concept.length; i++) { //logger.info("parsing concept " + concept[i]); bows[i] = new BOW(toText(concept[i])); //logger.info("concept " + bows[i]); //logger.info("size concept " + i + " " + bows[i].size()); f[i] = lss.compare(bow, bows[i]); logger.info(i + ", " + concept[i] + ", " + f[i]); //logger.info(i + " = " + f[i]); } return f; } // end compareAll
// Builds the similarity object from lsm and size.
LSSimilarity lss = new LSSimilarity(lsm, size);
// Compares bow with the i-th entry of bows and keeps the result as a float.
float f = lss.compare(bow, bows[i]);
// Builds the similarity object from lsm and size, then parses args[4] (presumably the fifth command-line argument — confirm) as a double; Double.parseDouble throws NumberFormatException on non-numeric text.
LSSimilarity lss = new LSSimilarity(lsm, size); double qt = Double.parseDouble(args[4]);
/**
 * Parses a page and a set of concept URLs into bags of words, logs the
 * comparison of the page with each concept, and then calls
 * {@code interactive} with the concepts, their bags of words and the similarity.
 *
 * @param page    the URL of the page to parse
 * @param concept the concept URLs to compare the page with
 * @param lss     the similarity used for the comparisons
 * @throws IOException declared by the constructor; propagated from the calls it makes
 */
public WebPageComparator(URL page, URL[] concept, LSSimilarity lss) throws IOException {
    logger.info("parsing " + page + "...");
    final BOW pageBow = new BOW(toText(page));
    logger.info("size bow " + pageBow.size());

    final int count = concept.length;
    final BOW[] conceptBows = new BOW[count];

    for (int idx = 0; idx < count; idx++) {
        final URL conceptUrl = concept[idx];
        logger.info("parsing concept " + conceptUrl);

        final BOW conceptBow = new BOW(toText(conceptUrl));
        conceptBows[idx] = conceptBow;
        logger.info("size concept " + idx + " " + conceptBow.size());

        final float score = lss.compare(pageBow, conceptBow);
        logger.info(idx + " = " + score);
    }

    interactive(concept, conceptBows, lss);
} // end constructor
// Builds the similarity object from lsm and size.
LSSimilarity lss = new LSSimilarity(lsm, size);
private float compare(BOW bow, String[] s, LSSimilarity lss) throws IOException, MalformedURLException { URL[] concept = getConceptURL(s); BOW[] bows = new BOW[concept.length]; float[] f = new float[concept.length]; for (int i = 0; i < concept.length; i++) { //logger.info("parsing concept " + concept[i]); bows[i] = new BOW(toText(concept[i])); //logger.info("concept " + bows[i]); //logger.info("size concept " + i + " " + bows[i].size()); f[i] = lss.compare(bow, bows[i]); logger.info(i + ", " + concept[i] + ", " + f[i]); //logger.info(i + " = " + f[i]); } int i = maxIndex(f); if (i != -1) { logger.info("max = " + concept[i] + ", " + f[i]); return f[i]; } return 0; } // end compare
// Builds the similarity object from lsm and size.
LSSimilarity lss = new LSSimilarity(lsm, size);