# Source code for InfoR.Examples.example
import sys
from InfoR.VectorSpaceModels import VSM
from InfoR.LanguageModels import LanguageModel
from InfoR.ProbabilitisticModels import ProbModel
def Corpus():
    """Print a short description of the default data set.

    Writes three fixed lines to standard output and returns ``None``.
    ``print`` is called with a single parenthesised argument so the
    output is the same under Python 2 (where this is a ``print``
    statement applied to a parenthesised expression) and Python 3.
    """
    print("The default data set is the corpus of my answers on Quora.")
    print("The answers can be seen at https://www.quora.com/Janu-Verma-2/answers")
    print("I answer questions on a varied range of topics and this would a good example for text analytics. ")
# Show the data-set banner as soon as the module is loaded.
Corpus()

# Path handed to every model constructor in this module
# (presumably the folder containing the corpus documents -- confirm).
directory = "Data"

# Search query
q = "mathematical physicist edward witten"
# Single-argument print(...) behaves identically on Python 2 and 3.
print("The search query is - " + q)

# Number of docs to be retrieved
n_docs = 5
print("Number of documents to be retrieved - " + str(n_docs))
def vsm():
    """Run the example query against the vector space model.

    Builds a ``VSM`` from the module-level ``directory`` and prints the
    result of ``search(q, n_docs)`` three times: with default arguments,
    with ``tf_idf=True``, and with ``tf_idf=True, LSA=True, n_comp=3``.
    Each result is preceded by a label line. Returns ``None``.
    """
    model = VSM(directory)

    # Single-argument print(...) gives the same output on Python 2 and 3.
    print("Search Results based on Frequency Counts : \n")
    print(model.search(q, n_docs))

    print("Search Results based on tf-idf vectors : \n")
    print(model.search(q, n_docs, tf_idf=True))

    print("Search Results based on tf-idf after performing LSA : \n")
    print("The number of LSA compnents is 3.")
    print(model.search(q, n_docs, tf_idf=True, LSA=True, n_comp=3))
def LM():
    """Run the example query against the language model.

    Builds a ``LanguageModel`` from the module-level ``directory`` and
    prints the result of ``search(q, n_docs)`` after a label line.
    Returns ``None``.
    """
    model = LanguageModel(directory)
    print("Search Results from Language Models: \n")
    print(model.search(q, n_docs))


def PM():
    """Run the example query against the probabilistic model.

    Builds a ``ProbModel`` from the module-level ``directory`` and prints
    the result of ``search(q, n_docs)`` after a label line. Returns
    ``None``.

    This function was previously also named ``LM``; being defined second,
    it silently replaced the language-model demo above. It has its own
    name now so that both demos are callable.
    """
    model = ProbModel(directory)
    print("Search Results from Probabilitistic Models: \n")
    print(model.search(q, n_docs))