Permalink
Browse files

added UCI corpus docs

  • Loading branch information...
1 parent ebe07e7 commit 28d887b654d2d231ee2da4a4bcff004b9d327a65 @piskvorky piskvorky committed Mar 8, 2012
Showing with 401 additions and 75 deletions.
  1. +1 −0 docs/_sources/apiref.txt
  2. +8 −0 docs/_sources/corpora/ucicorpus.txt
  3. +1 −1 docs/_sources/index.txt
  4. +1 −1 docs/about.html
  5. +2 −1 docs/apiref.html
  6. +1 −1 docs/changes_080.html
  7. +1 −1 docs/corpora/bleicorpus.html
  8. +1 −1 docs/corpora/corpora.html
  9. +1 −1 docs/corpora/dictionary.html
  10. +6 −6 docs/corpora/indexedcorpus.html
  11. +2 −2 docs/corpora/lowcorpus.html
  12. +1 −1 docs/corpora/mmcorpus.html
  13. +1 −1 docs/corpora/svmlightcorpus.html
  14. +6 −6 docs/corpora/textcorpus.html
  15. +259 −0 docs/corpora/ucicorpus.html
  16. +1 −1 docs/corpora/wikicorpus.html
  17. +1 −1 docs/dist_lda.html
  18. +1 −1 docs/dist_lsi.html
  19. +1 −1 docs/distributed.html
  20. +57 −7 docs/genindex.html
  21. +2 −9 docs/index.html
  22. +1 −1 docs/install.html
  23. +1 −1 docs/interfaces.html
  24. +1 −1 docs/intro.html
  25. +1 −1 docs/matutils.html
  26. +1 −1 docs/models/hdpmodel.html
  27. +1 −1 docs/models/lda_dispatcher.html
  28. +1 −1 docs/models/lda_worker.html
  29. +1 −1 docs/models/ldamodel.html
  30. +1 −1 docs/models/logentropy_model.html
  31. +1 −1 docs/models/lsi_dispatcher.html
  32. +1 −1 docs/models/lsi_worker.html
  33. +1 −1 docs/models/lsimodel.html
  34. +1 −1 docs/models/models.html
  35. +1 −1 docs/models/rpmodel.html
  36. +1 −1 docs/models/tfidfmodel.html
  37. BIN docs/objects.inv
  38. +6 −1 docs/py-modindex.html
  39. +1 −1 docs/search.html
  40. +1 −1 docs/searchindex.js
  41. +1 −1 docs/similarities/docsim.html
  42. +1 −1 docs/similarities/simserver.html
  43. +1 −1 docs/simserver.html
  44. +1 −0 docs/src/apiref.rst
  45. +2 −2 docs/src/conf.py
  46. +8 −0 docs/src/corpora/ucicorpus.rst
  47. +1 −1 docs/src/index.rst
  48. +1 −1 docs/tut1.html
  49. +1 −1 docs/tut2.html
  50. +1 −1 docs/tut3.html
  51. +1 −1 docs/tutorial.html
  52. +1 −1 docs/utils.html
  53. +1 −1 docs/wiki.html
  54. +1 −1 gensim/corpora/ucicorpus.py
  55. +1 −1 setup.py
View
@@ -18,6 +18,7 @@ Modules:
corpora/svmlightcorpus
corpora/wikicorpus
corpora/textcorpus
+ corpora/ucicorpus
corpora/indexedcorpus
models/ldamodel
models/lsimodel
@@ -0,0 +1,8 @@
+:mod:`corpora.ucicorpus` -- Corpus in UCI bag-of-words format
+==============================================================================================================
+
+.. automodule:: gensim.corpora.ucicorpus
+ :synopsis: Corpus in University of California, Irvine (UCI) bag-of-words format
+ :members:
+ :inherited-members:
+
View
@@ -44,7 +44,7 @@ Quick Reference Example
.. admonition:: What's new?
-
+ * 8 Mar 2012: release 0.8.4: `Hierarchical Dirichlet Process <http://radimrehurek.com/gensim/models/hdpmodel.html>`_
* 2 Dec 2011: bug-fix release 0.8.3 out; `CHANGELOG <https://github.com/piskvorky/gensim/blob/develop/CHANGELOG.txt>`_
* 1 Dec 2011: released `simserver <http://pypi.python.org/pypi/simserver>`_, a Python document similarity server based on gensim
View
@@ -16,7 +16,7 @@
<script type="text/javascript">
var DOCUMENTATION_OPTIONS = {
URL_ROOT: '',
- VERSION: '0.8.3',
+ VERSION: '0.8.4',
COLLAPSE_INDEX: false,
FILE_SUFFIX: '.html',
HAS_SOURCE: true
View
@@ -16,7 +16,7 @@
<script type="text/javascript">
var DOCUMENTATION_OPTIONS = {
URL_ROOT: '',
- VERSION: '0.8.3',
+ VERSION: '0.8.4',
COLLAPSE_INDEX: false,
FILE_SUFFIX: '.html',
HAS_SOURCE: true
@@ -126,6 +126,7 @@
<li class="toctree-l1"><a class="reference internal" href="corpora/svmlightcorpus.html"><tt class="docutils literal"><span class="pre">corpora.svmlightcorpus</span></tt> &#8211; Corpus in SVMlight format</a></li>
<li class="toctree-l1"><a class="reference internal" href="corpora/wikicorpus.html"><tt class="docutils literal"><span class="pre">corpora.wikicorpus</span></tt> &#8211; Corpus from a Wikipedia dump</a></li>
<li class="toctree-l1"><a class="reference internal" href="corpora/textcorpus.html"><tt class="docutils literal"><span class="pre">corpora.textcorpus</span></tt> &#8211; Building corpora with dictionaries</a></li>
+<li class="toctree-l1"><a class="reference internal" href="corpora/ucicorpus.html"><tt class="docutils literal"><span class="pre">corpora.ucicorpus</span></tt> &#8211; Corpus in UCI bag-of-words format</a></li>
<li class="toctree-l1"><a class="reference internal" href="corpora/indexedcorpus.html"><tt class="docutils literal"><span class="pre">corpora.indexedcorpus</span></tt> &#8211; Random access to corpus documents</a></li>
<li class="toctree-l1"><a class="reference internal" href="models/ldamodel.html"><tt class="docutils literal"><span class="pre">models.ldamodel</span></tt> &#8211; Latent Dirichlet Allocation</a></li>
<li class="toctree-l1"><a class="reference internal" href="models/lsimodel.html"><tt class="docutils literal"><span class="pre">models.lsimodel</span></tt> &#8211; Latent Semantic Indexing</a></li>
View
@@ -16,7 +16,7 @@
<script type="text/javascript">
var DOCUMENTATION_OPTIONS = {
URL_ROOT: '',
- VERSION: '0.8.3',
+ VERSION: '0.8.4',
COLLAPSE_INDEX: false,
FILE_SUFFIX: '.html',
HAS_SOURCE: true
@@ -16,7 +16,7 @@
<script type="text/javascript">
var DOCUMENTATION_OPTIONS = {
URL_ROOT: '../',
- VERSION: '0.8.3',
+ VERSION: '0.8.4',
COLLAPSE_INDEX: false,
FILE_SUFFIX: '.html',
HAS_SOURCE: true
@@ -16,7 +16,7 @@
<script type="text/javascript">
var DOCUMENTATION_OPTIONS = {
URL_ROOT: '../',
- VERSION: '0.8.3',
+ VERSION: '0.8.4',
COLLAPSE_INDEX: false,
FILE_SUFFIX: '.html',
HAS_SOURCE: true
@@ -16,7 +16,7 @@
<script type="text/javascript">
var DOCUMENTATION_OPTIONS = {
URL_ROOT: '../',
- VERSION: '0.8.3',
+ VERSION: '0.8.4',
COLLAPSE_INDEX: false,
FILE_SUFFIX: '.html',
HAS_SOURCE: true
@@ -16,7 +16,7 @@
<script type="text/javascript">
var DOCUMENTATION_OPTIONS = {
URL_ROOT: '../',
- VERSION: '0.8.3',
+ VERSION: '0.8.4',
COLLAPSE_INDEX: false,
FILE_SUFFIX: '.html',
HAS_SOURCE: true
@@ -29,7 +29,7 @@
<link rel="top" title="gensim" href="../index.html" />
<link rel="up" title="API Reference" href="../apiref.html" />
<link rel="next" title="models.ldamodel – Latent Dirichlet Allocation" href="../models/ldamodel.html" />
- <link rel="prev" title="corpora.textcorpus – Building corpora with dictionaries" href="textcorpus.html" />
+ <link rel="prev" title="corpora.ucicorpus – Corpus in University of California, Irvine (UCI) bag-of-words format" href="ucicorpus.html" />
<!-- twitter search widget
@@ -68,7 +68,7 @@
<a href="../models/ldamodel.html" title="models.ldamodel – Latent Dirichlet Allocation"
accesskey="N">next</a> |</li>
<li class="right" >
- <a href="textcorpus.html" title="corpora.textcorpus – Building corpora with dictionaries"
+ <a href="ucicorpus.html" title="corpora.ucicorpus – Corpus in University of California, Irvine (UCI) bag-of-words format"
accesskey="P">previous</a> |</li>
<li><a href="../index.html">Gensim home</a>|&nbsp;</li>
<li><a href="../tutorial.html">Tutorials</a>|&nbsp;</li>
@@ -84,8 +84,8 @@
<div class="sphinxsidebar">
<div class="sphinxsidebarwrapper">
<h4>Previous topic</h4>
- <p class="topless"><a href="textcorpus.html"
- title="previous chapter"><tt class="docutils literal"><span class="pre">corpora.textcorpus</span></tt> &#8211; Building corpora with dictionaries</a></p>
+ <p class="topless"><a href="ucicorpus.html"
+ title="previous chapter"><tt class="docutils literal"><span class="pre">corpora.ucicorpus</span></tt> &#8211; Corpus in University of California, Irvine (UCI) bag-of-words format</a></p>
<h4>Next topic</h4>
<p class="topless"><a href="../models/ldamodel.html"
title="next chapter"><tt class="docutils literal"><span class="pre">models.ldamodel</span></tt> &#8211; Latent Dirichlet Allocation</a></p>
@@ -222,7 +222,7 @@
<a href="../models/ldamodel.html" title="models.ldamodel – Latent Dirichlet Allocation"
>next</a> |</li>
<li class="right" >
- <a href="textcorpus.html" title="corpora.textcorpus – Building corpora with dictionaries"
+ <a href="ucicorpus.html" title="corpora.ucicorpus – Corpus in University of California, Irvine (UCI) bag-of-words format"
>previous</a> |</li>
<li><a href="../index.html">Gensim home</a>|&nbsp;</li>
<li><a href="../tutorial.html">Tutorials</a>|&nbsp;</li>
@@ -16,7 +16,7 @@
<script type="text/javascript">
var DOCUMENTATION_OPTIONS = {
URL_ROOT: '../',
- VERSION: '0.8.3',
+ VERSION: '0.8.4',
COLLAPSE_INDEX: false,
FILE_SUFFIX: '.html',
HAS_SOURCE: true
@@ -118,7 +118,7 @@
<p>Corpus in GibbsLda++ format of List-Of-Words.</p>
<dl class="class">
<dt id="gensim.corpora.lowcorpus.LowCorpus">
-<em class="property">class </em><tt class="descclassname">gensim.corpora.lowcorpus.</tt><tt class="descname">LowCorpus</tt><big>(</big><em>fname</em>, <em>id2word=None</em>, <em>line2words=&lt;function split_on_space at 0x27a21f0&gt;</em><big>)</big><a class="headerlink" href="#gensim.corpora.lowcorpus.LowCorpus" title="Permalink to this definition">¶</a></dt>
+<em class="property">class </em><tt class="descclassname">gensim.corpora.lowcorpus.</tt><tt class="descname">LowCorpus</tt><big>(</big><em>fname</em>, <em>id2word=None</em>, <em>line2words=&lt;function split_on_space at 0x27a21b0&gt;</em><big>)</big><a class="headerlink" href="#gensim.corpora.lowcorpus.LowCorpus" title="Permalink to this definition">¶</a></dt>
<dd><p>List_Of_Words corpus handles input in GibbsLda++ format.</p>
<p>Quoting <a class="reference external" href="http://gibbslda.sourceforge.net/#3.2_Input_Data_Format">http://gibbslda.sourceforge.net/#3.2_Input_Data_Format</a>:</p>
<div class="highlight-python"><pre>Both data for training/estimating the model and new data (i.e., previously
@@ -16,7 +16,7 @@
<script type="text/javascript">
var DOCUMENTATION_OPTIONS = {
URL_ROOT: '../',
- VERSION: '0.8.3',
+ VERSION: '0.8.4',
COLLAPSE_INDEX: false,
FILE_SUFFIX: '.html',
HAS_SOURCE: true
@@ -16,7 +16,7 @@
<script type="text/javascript">
var DOCUMENTATION_OPTIONS = {
URL_ROOT: '../',
- VERSION: '0.8.3',
+ VERSION: '0.8.4',
COLLAPSE_INDEX: false,
FILE_SUFFIX: '.html',
HAS_SOURCE: true
@@ -16,7 +16,7 @@
<script type="text/javascript">
var DOCUMENTATION_OPTIONS = {
URL_ROOT: '../',
- VERSION: '0.8.3',
+ VERSION: '0.8.4',
COLLAPSE_INDEX: false,
FILE_SUFFIX: '.html',
HAS_SOURCE: true
@@ -28,7 +28,7 @@
<link rel="author" title="About these documents" href="../about.html" />
<link rel="top" title="gensim" href="../index.html" />
<link rel="up" title="API Reference" href="../apiref.html" />
- <link rel="next" title="corpora.indexedcorpus – Random access to corpus documents" href="indexedcorpus.html" />
+ <link rel="next" title="corpora.ucicorpus – Corpus in University of California, Irvine (UCI) bag-of-words format" href="ucicorpus.html" />
<link rel="prev" title="corpora.wikicorpus – Corpus from a Wikipedia dump" href="wikicorpus.html" />
@@ -65,7 +65,7 @@
<a href="../py-modindex.html" title="Python Module Index"
>modules</a> |</li>
<li class="right" >
- <a href="indexedcorpus.html" title="corpora.indexedcorpus – Random access to corpus documents"
+ <a href="ucicorpus.html" title="corpora.ucicorpus – Corpus in University of California, Irvine (UCI) bag-of-words format"
accesskey="N">next</a> |</li>
<li class="right" >
<a href="wikicorpus.html" title="corpora.wikicorpus – Corpus from a Wikipedia dump"
@@ -87,8 +87,8 @@
<p class="topless"><a href="wikicorpus.html"
title="previous chapter"><tt class="docutils literal docutils literal"><span class="pre">corpora.wikicorpus</span></tt> &#8211; Corpus from a Wikipedia dump</a></p>
<h4>Next topic</h4>
- <p class="topless"><a href="indexedcorpus.html"
- title="next chapter"><tt class="docutils literal docutils literal"><span class="pre">corpora.indexedcorpus</span></tt> &#8211; Random access to corpus documents</a></p>
+ <p class="topless"><a href="ucicorpus.html"
+ title="next chapter"><tt class="docutils literal docutils literal"><span class="pre">corpora.ucicorpus</span></tt> &#8211; Corpus in University of California, Irvine (UCI) bag-of-words format</a></p>
<div id="searchbox" style="display: none">
<h3>Quick search</h3>
<form class="search" action="../search.html" method="get">
@@ -213,7 +213,7 @@
<a href="../py-modindex.html" title="Python Module Index"
>modules</a> |</li>
<li class="right" >
- <a href="indexedcorpus.html" title="corpora.indexedcorpus – Random access to corpus documents"
+ <a href="ucicorpus.html" title="corpora.ucicorpus – Corpus in University of California, Irvine (UCI) bag-of-words format"
>next</a> |</li>
<li class="right" >
<a href="wikicorpus.html" title="corpora.wikicorpus – Corpus from a Wikipedia dump"
Oops, something went wrong.

0 comments on commit 28d887b

Please sign in to comment.