private float[] compareAll(BOW bow, String[] s, LSSimilarity lss) throws IOException, MalformedURLException { URL[] concept = getConceptURL(s); BOW[] bows = new BOW[concept.length]; float[] f = new float[concept.length]; for (int i = 0; i < concept.length; i++) { //logger.info("parsing concept " + concept[i]); bows[i] = new BOW(toText(concept[i])); //logger.info("concept " + bows[i]); //logger.info("size concept " + i + " " + bows[i].size()); f[i] = lss.compare(bow, bows[i]); logger.info(i + ", " + concept[i] + ", " + f[i]); //logger.info(i + " = " + f[i]); } return f; } // end compareAll
// Stores the result of comparing bow with bows[i] via lss.compare in a float.
// NOTE(review): bow, bows and i are not declared in this fragment; presumably it
// belongs inside a loop over bows. Confirm against the enclosing code.
float f = lss.compare(bow, bows[i]);
// Stores the result of lss.compare for the two string literals "word" and "term".
// NOTE(review): this relies on a compare overload that accepts two Strings, and the
// name suggests a cosine-style score. Neither is visible here; confirm on lss's type.
float cos = lss.compare("word", "term");
/**
 * Parses {@code page} and every concept URL into bags of words, logs the score of the
 * page against each concept, and then calls {@code interactive} with the concepts,
 * their bags of words and the similarity.
 *
 * @param page    the URL whose text is turned into the page bag of words
 * @param concept the concept URLs; each one is parsed and compared in array order
 * @param lss     the similarity used for the comparisons and passed to {@code interactive}
 * @throws IOException declared by this constructor; presumably raised while reading
 *         one of the URLs (the helpers are not visible here, so confirm)
 */
public WebPageComparator(URL page, URL[] concept, LSSimilarity lss) throws IOException {
    logger.info("parsing " + page + "...");
    final BOW pageBow = new BOW(toText(page));
    logger.info("size bow " + pageBow.size());

    // The concept bags are kept because interactive(...) receives the whole array.
    final BOW[] conceptBows = new BOW[concept.length];
    int index = 0;
    for (URL conceptUrl : concept) {
        logger.info("parsing concept " + conceptUrl);
        final BOW conceptBow = new BOW(toText(conceptUrl));
        conceptBows[index] = conceptBow;
        logger.info("size concept " + index + " " + conceptBow.size());

        // The score is only logged here; it is not stored.
        final float score = lss.compare(pageBow, conceptBow);
        logger.info(index + " = " + score);
        index++;
    }

    interactive(concept, conceptBows, lss);
} // end constructor
private float compare(BOW bow, String[] s, LSSimilarity lss) throws IOException, MalformedURLException { URL[] concept = getConceptURL(s); BOW[] bows = new BOW[concept.length]; float[] f = new float[concept.length]; for (int i = 0; i < concept.length; i++) { //logger.info("parsing concept " + concept[i]); bows[i] = new BOW(toText(concept[i])); //logger.info("concept " + bows[i]); //logger.info("size concept " + i + " " + bows[i].size()); f[i] = lss.compare(bow, bows[i]); logger.info(i + ", " + concept[i] + ", " + f[i]); //logger.info(i + " = " + f[i]); } int i = maxIndex(f); if (i != -1) { logger.info("max = " + concept[i] + ", " + f[i]); return f[i]; } return 0; } // end compare