org.carrot2.core.Cluster.getSubclusters java code examples

  /**
   * Accepts only those clusters that have at least one subcluster.
   *
   * @param cluster the cluster to test
   * @return <code>true</code> if the cluster's subcluster list is not empty
   */
  public boolean apply(Cluster cluster)
  {
    final boolean childless = cluster.getSubclusters().isEmpty();
    return !childless;
  }
});

/**
 * Appends every cluster from <code>hierarchical</code> to <code>flat</code>, each one
 * immediately followed by its own sub-clusters (parent first, then descendants).
 *
 * @param hierarchical the clusters to walk, together with their sub-clusters
 * @param flat the list that receives the visited clusters
 * @return the same <code>flat</code> list that was passed in
 */
private static List<Cluster> flatten(Collection<Cluster> hierarchical, List<Cluster> flat)
{
  for (final Cluster node : hierarchical)
  {
    flat.add(node);

    // Descending into an empty child list would add nothing, so skip the call.
    final List<Cluster> children = node.getSubclusters();
    if (!children.isEmpty())
    {
      flatten(children, flat);
    }
  }
  return flat;
}

/**
 * Searches <code>clusters</code> and, recursively, all of their sub-clusters for a
 * cluster whose identifier equals <code>id</code>. A cluster is checked before its
 * sub-clusters, and the first match encountered is returned.
 *
 * @param id the identifier to look for
 * @param clusters the clusters to search; <code>null</code> elements are skipped
 * @return the first cluster with a matching identifier, or <code>null</code> if no
 *         such cluster could be found
 */
public static Cluster find(int id, Collection<Cluster> clusters)
{
  for (final Cluster candidate : clusters)
  {
    if (candidate == null)
    {
      continue;
    }

    // Clusters without an assigned identifier can never match.
    if (candidate.id != null && candidate.id == id)
    {
      return candidate;
    }

    final Collection<Cluster> children = candidate.getSubclusters();
    if (children.isEmpty())
    {
      continue;
    }

    final Cluster match = find(id, children);
    if (match != null)
    {
      return match;
    }
  }
  return null;
}

  /**
   * Returns a short description containing the label, the value of
   * <code>size()</code> and the number of direct subclusters.
   */
  @Override
  public String toString()
  {
    final StringBuilder text = new StringBuilder("[Cluster, label: ");
    text.append(getLabel());
    text.append(", docs: ").append(size());
    text.append(", subclusters: ").append(getSubclusters().size());
    return text.append("]").toString();
  }
}

/**
 * Upon deserialization, replaces the document refids stored in <code>cluster</code>
 * with the actual document references, then does the same for every subcluster.
 *
 * @param cluster the cluster whose <code>documentIds</code> are to be resolved
 * @param documents the documents, looked up by refid
 */
private void documentIdToReference(Cluster cluster, Map<String, Document> documents)
{
  final boolean hasRefids = cluster.documentIds != null;
  if (hasRefids)
  {
    for (Cluster.DocumentRefid ref : cluster.documentIds)
    {
      final Document resolved = documents.get(ref.refid);
      cluster.addDocuments(resolved);
    }
  }

  // Subclusters carry their own refids; resolve them recursively.
  for (Cluster child : cluster.getSubclusters())
  {
    documentIdToReference(child, documents);
  }
}

/**
 * Recursively gathers the documents of <code>cluster</code> and of all its
 * subclusters into <code>docs</code>; the set keeps each document only once.
 *
 * @param cluster the cluster to start from; <code>null</code> contributes nothing
 * @param docs the set that accumulates the documents
 * @return the same <code>docs</code> set that was passed in
 */
private static Set<Document> collectAllDocuments(Cluster cluster, Set<Document> docs)
{
  if (cluster != null)
  {
    docs.addAll(cluster.getDocuments());
    for (final Cluster child : cluster.getSubclusters())
    {
      collectAllDocuments(child, docs);
    }
  }
  return docs;
}

/**
 * Converts clusters into named-list entries appended to <code>parent</code>.
 * <p>
 * For every cluster one entry is added to <code>parent</code>, holding:
 * <ul>
 * <li><code>labels</code> - the cluster's phrases, cut down to the first
 *     <code>maxLabels</code> when there are more,</li>
 * <li><code>docs</code> - the <code>solrId</code> field of each document,</li>
 * <li><code>clusters</code> - entries for the subclusters, present only when
 *     <code>outputSubClusters</code> is <code>true</code>.</li>
 * </ul>
 * When subclusters are output, <code>docs</code> is built from
 * <code>getDocuments()</code>; otherwise from <code>getAllDocuments()</code>.
 *
 * @param outputClusters the clusters to convert
 * @param parent the list receiving one entry per cluster; kept as a raw
 *        <code>List</code> so existing callers compile unchanged
 * @param outputSubClusters whether to emit subclusters as nested entries
 * @param maxLabels the maximum number of labels to output per cluster
 */
private void clustersToNamedList(List<Cluster> outputClusters,
                 List parent, boolean outputSubClusters, int maxLabels) {
  for (Cluster outCluster : outputClusters) {
    NamedList<Object> cluster = new SimpleOrderedMap<Object>();
    parent.add(cluster);

    List<String> labels = outCluster.getPhrases();
    if (labels.size() > maxLabels) {
      labels = labels.subList(0, maxLabels);
    }
    cluster.add("labels", labels);

    List<Document> docs = outputSubClusters ? outCluster.getDocuments() : outCluster.getAllDocuments();
    List<Object> docList = new ArrayList<Object>(docs.size());
    cluster.add("docs", docList);
    for (Document doc : docs) {
      docList.add(doc.getField("solrId"));
    }

    if (outputSubClusters) {
      List<NamedList<Object>> subclusters = new ArrayList<NamedList<Object>>();
      cluster.add("clusters", subclusters);
      clustersToNamedList(outCluster.getSubclusters(), subclusters,
          outputSubClusters, maxLabels);
    }
  }
}

  /**
   * Builds a copy of the given cluster hierarchy. Each copied cluster receives the
   * source cluster's phrases, only those of its documents accepted by
   * <code>docFilter</code>, and recursively processed copies of its subclusters.
   *
   * @param in the clusters to copy
   * @param docFilter decides which documents are carried over to the copies
   * @return a new list with one copied cluster per input cluster, in input order
   */
  private static List<Cluster> sanityCheck(List<Cluster> in, Predicate<Document> docFilter)
  {
    final List<Cluster> result = Lists.newArrayListWithCapacity(in.size());
    for (final Cluster source : in) {
      final Cluster copy = new Cluster();
      copy.addPhrases(source.getPhrases());

      final Iterable<Document> accepted = Iterables.filter(source.getDocuments(), docFilter);
      copy.addDocuments(accepted);

      final List<Cluster> children = sanityCheck(source.getSubclusters(), docFilter);
      copy.addSubclusters(children);

      result.add(copy);
    }
    return result;
  }
}

if (outputSubClusters && !outCluster.getSubclusters().isEmpty()) {
 List<NamedList<Object>> subclusters = new ArrayList<>();
 cluster.add("clusters", subclusters);
 clustersToNamedList(outCluster.getSubclusters(), subclusters,
     outputSubClusters, maxLabels);

// NOTE(review): condensed excerpt - braces and intermediate statements appear to
// have been elided, so this does not compile as shown.
// Walks the subclusters of each cluster; in the inner loop the subclusters of
// majorLanguageCluster (declared outside this excerpt) are appended to
// flattenedClusters.
for (Cluster cluster : clusters)
  final List<Cluster> subclusters = cluster.getSubclusters();
  for (Cluster subcluster : subclusters)
    flattenedClusters.addAll(majorLanguageCluster.getSubclusters());

// Use the subcluster's first phrase as the label, then add the subcluster's
// documents and its own subclusters to cluster.
clusterLabel = subcluster.getPhrases().get(0);
cluster.addDocuments(subcluster.getDocuments());
cluster.addSubclusters(subcluster.getSubclusters());

Javadoc

Returns all subclusters of this cluster. The returned list is unmodifiable.

Popular methods of Cluster

getAllDocuments
Returns all documents in this cluster ordered according to the provided comparator. See Document for
getDocuments
Returns all documents contained in this cluster. The returned list is unmodifiable.
getPhrases
Returns all phrases describing this cluster. The returned list is unmodifiable.
getLabel
Formats this cluster's label. If there is more than one phrase describing this cluster, phrases will
isOtherTopics
Returns true if this cluster is the #OTHER_TOPICS cluster.
<init>
Creates a Cluster with the provided phrase to be used as the cluster's label and documents containe
addDocuments
Adds document to this cluster.
addPhrases
Adds phrases to the description of this cluster.
addSubclusters
Adds subclusters to this cluster
appendOtherTopics
If there are unclustered documents, appends the "Other Topics" group to the clusters.
assignClusterIds
Assigns sequential identifiers to the provided clusters (and their sub-clusters). If any cluster alr
buildOtherTopics
Builds an "Other Topics" cluster that groups those documents from allDocument that were not referenc

Popular in Java

Making http post requests using okhttp
getOriginalFilename (MultipartFile)
Return the original filename in the client's filesystem. This may contain path information depending
putExtra (Intent)
onRequestPermissionsResult (Fragment)
EOFException (java.io)
Thrown when a program encounters the end of a file or stream during an input operation.
ByteBuffer (java.nio)
A buffer for bytes. A byte buffer can be created in either one of the following ways: * #allocate
Executor (java.util.concurrent)
An object that executes submitted Runnable tasks. This interface provides a way of decoupling task s
Logger (org.slf4j)
The org.slf4j.Logger interface is the main user entry point of SLF4J API. It is expected that loggin
JList (javax.swing)
Get (org.apache.hadoop.hbase.client)
Used to perform Get operations on a single row. To get everything for a row, instantiate a Get objec
Github Copilot alternatives

How to use getSubclusters method in org.carrot2.core.Cluster

Best Java code snippets using org.carrot2.core.Cluster.getSubclusters (Showing top 11 results out of 315)

How to use
getSubclusters
method
in
org.carrot2.core.Cluster