/**
 * Builds an {@code IndianBuffet<String>} from the given {@code alpha} and a
 * freshly constructed {@code WordConverter}.
 *
 * @param alpha value handed unchanged to the {@code IndianBuffet} constructor.
 *              NOTE(review): presumably the concentration parameter of the
 *              Indian Buffet process - confirm against the constructor.
 * @return a new sampler instance; nothing is cached or shared between calls
 */
public static IndianBuffet<String> createTextDocumentSampler(double alpha) {
  WordConverter wordConverter = new WordConverter();
  return new IndianBuffet<>(alpha, wordConverter);
}
/**
 * Smoke test for the text document sampler: draws 30 documents from a sampler
 * created with alpha = 30, tallies document lengths and word occurrences, and
 * prints each document to standard output.
 *
 * <p>The tallies are collected but this method makes no assertions on them.
 */
@Test
public void testBasicText() {
  // NOTE(review): presumably pins the random seed so runs are repeatable - confirm.
  RandomUtils.useTestSeed();

  IndianBuffet<String> buffet = IndianBuffet.createTextDocumentSampler(30);
  Multiset<String> wordCounts = HashMultiset.create();
  // Histogram indexed by document size; a document of 100 or more words
  // would index past the end of this array.
  int[] lengthHistogram = new int[100];

  for (int trial = 0; trial < 30; trial++) {
    final List<String> document = buffet.sample();
    lengthHistogram[document.size()]++;
    // Adds one occurrence per word, same as adding the words one by one.
    wordCounts.addAll(document);
    System.out.printf("%s\n", document);
  }
}
} // closes the enclosing class, whose header lies outside this view
/**
 * Builds an {@code IndianBuffet<Integer>} from the given {@code alpha} and a
 * freshly constructed {@code IdentityConverter}.
 *
 * @param alpha value handed unchanged to the {@code IndianBuffet} constructor.
 *              NOTE(review): presumably the concentration parameter of the
 *              Indian Buffet process - confirm against the constructor.
 * @return a new sampler instance; nothing is cached or shared between calls
 */
public static IndianBuffet<Integer> createIntegerDocumentSampler(double alpha) {
  IdentityConverter identityConverter = new IdentityConverter();
  return new IndianBuffet<>(alpha, identityConverter);
}
/**
 * Builds an {@code IndianBuffet<Integer>} from the given {@code alpha} and a
 * freshly constructed {@code IdentityConverter}.
 *
 * <p>NOTE(review): a method with this exact signature also appears directly
 * before this one in the visible source; if both live in the same class, only
 * one can remain - confirm.
 *
 * @param alpha value handed unchanged to the {@code IndianBuffet} constructor
 * @return a new sampler instance; nothing is cached or shared between calls
 */
public static IndianBuffet<Integer> createIntegerDocumentSampler(double alpha) {
  IdentityConverter identityConverter = new IdentityConverter();
  return new IndianBuffet<>(alpha, identityConverter);
}
/**
 * Builds an {@code IndianBuffet<String>} from the given {@code alpha} and a
 * freshly constructed {@code WordConverter}.
 *
 * <p>NOTE(review): a method with this exact signature also appears earlier in
 * the visible source; if both live in the same class, only one can remain -
 * confirm.
 *
 * @param alpha value handed unchanged to the {@code IndianBuffet} constructor
 * @return a new sampler instance; nothing is cached or shared between calls
 */
public static IndianBuffet<String> createTextDocumentSampler(double alpha) {
  WordConverter wordConverter = new WordConverter();
  return new IndianBuffet<>(alpha, wordConverter);
}