Java Cluster.appendOtherTopics Exemples

Langage de programmation: Java

Espace de nommage/Package : org.carrot2.core

Class/Type: Cluster

Méthode/Fonction: appendOtherTopics

Exemples sur hotexamples.com : 4

Java Cluster.appendOtherTopics - 4 exemples trouvés. Ce sont les exemples réels les mieux notés de org.carrot2.core.Cluster.appendOtherTopics extraits de projets open source. Vous pouvez noter les exemples pour nous aider à en améliorer la qualité.

Méthodes fréquemment utilisées

Afficher Cacher

addDocuments(6)

getSubclusters(5)

appendOtherTopics(4)

addPhrases(4)

getAllDocuments(3)

getLabel(3)

getDocuments(3)

flatten(2)

collectAllDocuments(2)

byReversedWeightedScoreAndSizeComparator(2)

isOtherTopics(2)

setAttribute(2)

size(2)

getAttribute(1)

assignClusterIds(1)

id(1)

setOtherTopics(1)

setScore(1)

Méthodes fréquemment utilisées

addDocuments (6)

getSubclusters (5)

appendOtherTopics (4)

addPhrases (4)

getAllDocuments (3)

getLabel (3)

getDocuments (3)

flatten (2)

collectAllDocuments (2)

byReversedWeightedScoreAndSizeComparator (2)

Méthodes fréquemment utilisées

isOtherTopics (2)

setAttribute (2)

size (2)

getAttribute (1)

assignClusterIds (1)

id (1)

setOtherTopics (1)

setScore (1)

Associées

VertCoord

NBTCompoundTag

RFModel

Kernel32.INSTANCE

LocatableAnnotation

Xoctg_catpage_itm

IConfigDialogContent

TestApplication

AreaAdapter

ConnectController

Related in langs

smooth_path (PHP)

IpnEntity (PHP)

IndexedBitMatrix (C#)

IPDATA_IPv6 (C#)

jround_up (C++)

wxT (C++)

Amount (Go)

Logger (Go)

sha_for (Python)

error (Python)

Exemple #1

0

Afficher le fichier

Fichier : ByFieldClusteringAlgorithm.java Projet : changbai1980/carrot2

/**
 * Groups the input documents into clusters keyed by the value(s) of the configured field.
 *
 * <p>Each document's field is read with {@code getField(fieldName)}. When the field holds a
 * {@link Collection}, the document is handed to {@code addToCluster} once per element;
 * otherwise it is handed over once with the field value itself. The resulting clusters are
 * sorted with {@code Cluster.BY_REVERSED_SIZE_AND_LABEL_COMPARATOR}, after which
 * {@code Cluster.appendOtherTopics} is invoked with the full document list.
 */
@Override
public void process() throws ProcessingException {
  final Map<Object, Cluster> byFieldValue = Maps.newHashMap();

  for (Document doc : documents) {
    final Object fieldValue = doc.getField(fieldName);

    if (!(fieldValue instanceof Collection<?>)) {
      // Non-collection value (this includes null): a single cluster key.
      addToCluster(byFieldValue, fieldValue, doc);
      continue;
    }

    // Multi-valued field: one cluster key per element.
    for (Object element : (Collection<?>) fieldValue) {
      addToCluster(byFieldValue, element, doc);
    }
  }

  clusters = Lists.newArrayList(byFieldValue.values());
  Collections.sort(clusters, Cluster.BY_REVERSED_SIZE_AND_LABEL_COMPARATOR);
  Cluster.appendOtherTopics(documents, clusters);
}

Exemple #2

0

Afficher le fichier

Fichier : STCClusteringAlgorithm.java Projet : nkabir/carrot2

/** * Create the junk (unassigned documents) cluster and create the final set of clusters in Carrot2 * format. */ private void postProcessing(ArrayList<ClusterCandidate> clusters) { // Adapt to Carrot2 classes, counting used documents on the way. final BitSet all = new BitSet(documents.size()); final ArrayList<Document> docs = Lists.newArrayListWithCapacity(documents.size()); final ArrayList<String> phrases = Lists.newArrayListWithCapacity(3); for (ClusterCandidate c : clusters) { final Cluster c2 = new Cluster(); c2.addPhrases(collectPhrases(phrases, c)); c2.addDocuments(collectDocuments(docs, c.documents)); c2.setScore((double) c.score); this.clusters.add(c2); all.or(c.documents); docs.clear(); phrases.clear(); } Cluster.appendOtherTopics(this.documents, this.clusters); }

Exemple #3

0

Afficher le fichier

Fichier : Cluster.java Projet : ashish0038/rahasia

/**
 * Appends the "Other Topics" group to <code>clusters</code> when some documents are left
 * unclustered, labelling it with {@code OTHER_TOPICS_LABEL}.
 *
 * <p>This overload simply delegates to the three-argument {@code appendOtherTopics}.
 *
 * @param allDocuments all documents, forwarded unchanged to the three-argument overload
 * @param clusters the cluster list, forwarded unchanged to the three-argument overload
 * @see #buildOtherTopics(List, List)
 */
public static void appendOtherTopics(
    List<Document> allDocuments,
    List<Cluster> clusters) {
  appendOtherTopics(allDocuments, clusters, OTHER_TOPICS_LABEL);
}

Exemple #4

0

Afficher le fichier

Fichier : LingoClusteringAlgorithm.java Projet : kimgungoo/carrot2

/** * Performs the actual clustering with an assumption that all documents are written in one <code> * language</code>. */ private void cluster(LanguageCode language) { // Preprocessing of documents final PreprocessingContext context = preprocessingPipeline.preprocess(documents, query, language); // Further processing only if there are words to process clusters = Lists.newArrayList(); if (context.hasLabels()) { // Term-document matrix building and reduction final VectorSpaceModelContext vsmContext = new VectorSpaceModelContext(context); final ReducedVectorSpaceModelContext reducedVsmContext = new ReducedVectorSpaceModelContext(vsmContext); LingoProcessingContext lingoContext = new LingoProcessingContext(reducedVsmContext); matrixBuilder.buildTermDocumentMatrix(vsmContext); matrixBuilder.buildTermPhraseMatrix(vsmContext); matrixReducer.reduce( reducedVsmContext, computeClusterCount(desiredClusterCountBase, documents.size())); // Cluster label building clusterBuilder.buildLabels(lingoContext, matrixBuilder.termWeighting); // Document assignment clusterBuilder.assignDocuments(lingoContext); // Cluster merging clusterBuilder.merge(lingoContext); // Format final clusters final int[] clusterLabelIndex = lingoContext.clusterLabelFeatureIndex; final BitSet[] clusterDocuments = lingoContext.clusterDocuments; final double[] clusterLabelScore = lingoContext.clusterLabelScore; for (int i = 0; i < clusterLabelIndex.length; i++) { final Cluster cluster = new Cluster(); final int labelFeature = clusterLabelIndex[i]; if (labelFeature < 0) { // Cluster removed during merging continue; } // Add label and score cluster.addPhrases(labelFormatter.format(context, labelFeature)); cluster.setAttribute(Cluster.SCORE, clusterLabelScore[i]); // Add documents final BitSet bs = clusterDocuments[i]; for (int bit = bs.nextSetBit(0); bit >= 0; bit = bs.nextSetBit(bit + 1)) { cluster.addDocuments(documents.get(bit)); } // Add cluster clusters.add(cluster); } Collections.sort(clusters, 
Cluster.byReversedWeightedScoreAndSizeComparator(scoreWeight)); } Cluster.appendOtherTopics(documents, clusters); }