cc.mallet.topics
Class LDA
java.lang.Object
  extended by cc.mallet.topics.LDA
- All Implemented Interfaces:
- java.io.Serializable
public class LDA
- extends java.lang.Object
- implements java.io.Serializable
Latent Dirichlet Allocation.
- Author:
- Andrew McCallum
- See Also:
- Serialized Form
Constructor Summary
LDA(int numberOfTopics)
LDA(int numberOfTopics, double alphaSum, double beta)
Method Summary
void addDocuments(InstanceList additionalDocuments, int numIterations, int showTopicsInterval, int outputModelInterval, java.lang.String outputModelFilename, Randoms r)
void estimate(InstanceList documents, int numIterations, int showTopicsInterval, int outputModelInterval, java.lang.String outputModelFilename, Randoms r)
void estimate(int docIndexStart, int docIndexLength, int numIterations, int showTopicsInterval, int outputModelInterval, java.lang.String outputModelFilename, Randoms r)
int[][] getDocTopicCounts()
InstanceList getInstanceList()
int[] getTokensPerTopic()
int[][] getTypeTopicCounts()
static void main(java.lang.String[] args)
void printDocumentTopics(java.io.File f)
void printDocumentTopics(java.io.PrintWriter pw)
void printDocumentTopics(java.io.PrintWriter pw, double threshold, int max)
void printState(java.io.File f)
void printState(java.io.PrintWriter pw)
void printTopWords(int numWords, boolean useNewLines)
void sampleTopicsForAllDocs(Randoms r)
void sampleTopicsForDocs(int start, int length, Randoms r)
void write(java.io.File f)
Methods inherited from class java.lang.Object
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
LDA
public LDA(int numberOfTopics)
LDA
public LDA(int numberOfTopics,
double alphaSum,
double beta)
estimate
public void estimate(InstanceList documents,
int numIterations,
int showTopicsInterval,
int outputModelInterval,
java.lang.String outputModelFilename,
Randoms r)
addDocuments
public void addDocuments(InstanceList additionalDocuments,
int numIterations,
int showTopicsInterval,
int outputModelInterval,
java.lang.String outputModelFilename,
Randoms r)
estimate
public void estimate(int docIndexStart,
int docIndexLength,
int numIterations,
int showTopicsInterval,
int outputModelInterval,
java.lang.String outputModelFilename,
Randoms r)
sampleTopicsForAllDocs
public void sampleTopicsForAllDocs(Randoms r)
sampleTopicsForDocs
public void sampleTopicsForDocs(int start,
int length,
Randoms r)
getDocTopicCounts
public int[][] getDocTopicCounts()
getTypeTopicCounts
public int[][] getTypeTopicCounts()
getTokensPerTopic
public int[] getTokensPerTopic()
printTopWords
public void printTopWords(int numWords,
boolean useNewLines)
printDocumentTopics
public void printDocumentTopics(java.io.File f)
throws java.io.IOException
- Throws:
java.io.IOException
printDocumentTopics
public void printDocumentTopics(java.io.PrintWriter pw)
printDocumentTopics
public void printDocumentTopics(java.io.PrintWriter pw,
double threshold,
int max)
printState
public void printState(java.io.File f)
throws java.io.IOException
- Throws:
java.io.IOException
printState
public void printState(java.io.PrintWriter pw)
write
public void write(java.io.File f)
getInstanceList
public InstanceList getInstanceList()
main
public static void main(java.lang.String[] args)
throws java.io.IOException
- Throws:
java.io.IOException