fix review comments

piskvorky · menshikh-iv · Jan 22, 2018 · Sep 30, 2017 · Oct 2, 2017 · Oct 2, 2017
commit e3a8ebf71fb9f6f8b248bad16d0d94baabf9a28d
diff --git a/gensim/corpora/bleicorpus.py b/gensim/corpora/bleicorpus.py
@@ -41,9 +41,14 @@ def __init__(self, fname, fname_vocab=None):
         Parameters
         ----------
         fname : str
-            File path to Serialized corpus.
+            Path to corpus.
         fname_vocab : str, optional
-            Vocabulary file. If `fname_vocab` is None, searching for the vocab.txt or `fname_vocab`.vocab file.
+            Vocabulary file. If `fname_vocab` is None, the following variants are searched:
+
+            * `fname`.vocab
+            * `fname`/vocab.txt
+            * `fname_without_ext`.vocab
+            * `fname_folder`/vocab.txt
 
         Raises
         ------
@@ -120,9 +125,9 @@ def save_corpus(fname, corpus, id2word=None, metadata=False):
         Parameters
         ----------
         fname : str
-            Path to output filename.
+            Path to output file.
         corpus : iterable of iterable of (int, float)
-            Input corpus
+            Input corpus in BoW format.
         id2word : dict of (str, str), optional
             Mapping id -> word for `corpus`.
         metadata : bool, optional
@@ -160,8 +165,8 @@ def save_corpus(fname, corpus, id2word=None, metadata=False):
         return offsets
 
     def docbyoffset(self, offset):
-        """Get document corresponding to `offset`,
-        offset can be given from :meth:`~gensim.corpora.bleicorpus.BleiCorpus.save_corpus`.
+        """Get document corresponding to `offset`.
+        The offset can be obtained from :meth:`~gensim.corpora.bleicorpus.BleiCorpus.save_corpus`.
 
         Parameters
         ----------

diff --git a/gensim/corpora/csvcorpus.py b/gensim/corpora/csvcorpus.py
@@ -34,7 +34,7 @@ def __init__(self, fname, labels):
         Parameters
         ----------
         fname : str
-            Path to corpus in CSV format.
+            Path to corpus.
         labels : bool
             If True - ignore first column (class labels).
 

diff --git a/gensim/corpora/indexedcorpus.py b/gensim/corpora/indexedcorpus.py
@@ -49,7 +49,7 @@ def __init__(self, fname, index_fname=None):
         Parameters
         ----------
         fname : str
-            Path to indexed corpus.
+            Path to corpus.
         index_fname : str, optional
             Path to index, if not provided - used `fname.index`.
 
@@ -73,9 +73,9 @@ def serialize(serializer, fname, corpus, id2word=None, index_fname=None,
         Parameters
         ----------
         fname : str
-            Path to output filename
+            Path to output file.
         corpus : iterable of iterable of (int, float)
-            Corpus in BoW format
+            Corpus in BoW format.
         id2word : dict of (str, str), optional
             Mapping id -> word.
         index_fname : str, optional

diff --git a/gensim/corpora/svmlightcorpus.py b/gensim/corpora/svmlightcorpus.py
@@ -49,7 +49,7 @@ def __init__(self, fname, store_labels=True):
         Parameters
         ----------
         fname: str
-            Path to corpus in SVMlight format.
+            Path to corpus.
         store_labels : bool, optional
             Whether to store labels (~SVM target class). They currently have no application but stored
             in `self.labels` for convenience by default.
@@ -138,8 +138,8 @@ def docbyoffset(self, offset):
             # TODO: it brakes if gets None from line2doc
 
     def line2doc(self, line):
-        """Get a document from a single line in SVMlight format,
-        inverse of :meth:`~gensim.corpora.svmlightcorpus.SvmLightCorpus.doc2line`.
+        """Get a document from a single line in SVMlight format.
+        This method is the inverse of :meth:`~gensim.corpora.svmlightcorpus.SvmLightCorpus.doc2line`.
 
         Parameters
         ----------
@@ -166,8 +166,8 @@ def line2doc(self, line):
 
     @staticmethod
     def doc2line(doc, label=0):
-        """Convert BoW representation of document in SVMlight format,
-        inverse of :meth:`~gensim.corpora.svmlightcorpus.SvmLightCorpus.line2doc`.
+        """Convert BoW representation of document to SVMlight format.
+        This method is the inverse of :meth:`~gensim.corpora.svmlightcorpus.SvmLightCorpus.line2doc`.
 
         Parameters
         ----------

diff --git a/gensim/corpora/wikicorpus.py b/gensim/corpora/wikicorpus.py
@@ -168,7 +168,7 @@ def remove_template(s):
     Parameters
     ----------
     s : str
-        String containing markup template
+        String containing markup template.
 
     Returns
     -------
@@ -250,7 +250,7 @@ def tokenize(content, token_min_len=TOKEN_MIN_LEN, token_max_len=TOKEN_MAX_LEN,
     token_min_len : int
         Minimal token length.
     token_max_len : int
-        Maximal token length
+        Maximal token length.
     lower : bool
          If True - convert `content` to lower case.
 
@@ -299,7 +299,7 @@ def extract_pages(f, filter_namespaces=False):
     f : file
         File-like object.
     filter_namespaces : list of str or bool
-         Namespaces that will be extracted
+         Namespaces that will be extracted.
 
     Yields
     ------
@@ -517,7 +517,7 @@ def get_texts(self):
         Notes
         -----
         This iterates over the **texts**. If you want vectors, just use the standard corpus interface
-        instead of this method
+        instead of this method:
 
         >>> for vec in wiki_corpus:
         >>>     print(vec)