diff --git a/.circleci/config.yml b/.circleci/config.yml
deleted file mode 100644
index 1071aa5aeb..0000000000
--- a/.circleci/config.yml
+++ /dev/null
@@ -1,48 +0,0 @@
-version: 2
-jobs:
-  build:
-    docker:
-      - image: cimg/python:3.8.11
-
-    working_directory: ~/gensim
-
-    steps:
-      - checkout
-
-      - restore_cache:
-          key: pip-cache
-
-      - run:
-          name: Apt install (for latex render)
-          command: |
-            sudo apt-get -yq update
-            sudo apt-get -yq remove texlive-binaries --purge
-            sudo apt-get -yq --no-install-suggests --no-install-recommends --force-yes install dvipng texlive-latex-base texlive-latex-extra texlive-latex-recommended texlive-latex-extra texlive-fonts-recommended latexmk
-            sudo apt-get -yq install build-essential python3.8-dev
-
-      - run:
-          name: Basic installation (tox)
-          command: |
-            python3.8 -m virtualenv venv
-            source venv/bin/activate
-            pip install tox --progress-bar off
-
-      - run:
-          name: Build documentation
-          environment:
-            TOX_PARALLEL_NO_SPINNER: 1
-            TOX_PIP_OPTS: --progress-bar=off
-          command: |
-            source venv/bin/activate
-            tox -e compile,docs -vv
-
-      - store_artifacts:
-          path: docs/src/_build
-          destination: documentation
-
-      - save_cache:
-          key: pip-cache
-          paths:
-            - "~/.cache/pip"
-            - "~/.ccache"
-            - "~/.pip-cache"
diff --git a/.github/workflows/build-wheels.yml b/.github/workflows/build-wheels.yml
index ff304ea1c7..42f61bb8b2 100644
--- a/.github/workflows/build-wheels.yml
+++ b/.github/workflows/build-wheels.yml
@@ -10,6 +10,7 @@ on:
 
 jobs:
   build:
+    timeout-minutes: 30
     runs-on: ${{ matrix.os }}
     defaults:
       run:
diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml
index 530aff2683..f09b21d61d 100644
--- a/.github/workflows/tests.yml
+++ b/.github/workflows/tests.yml
@@ -6,8 +6,79 @@ on:
     branches: [ develop ]
 
 jobs:
+  linters:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v2
+
+      - name: Set up Python ${{ matrix.python }}
+        uses: actions/setup-python@v2
+        with:
+          python-version: ${{ matrix.python }}
+
+      - name: Update pip
+        run: python -m pip install -U pip
+
+      - name: Install dependencies
+        run: python -m pip install flake8 flake8-rst
+
+      - name: Run flake8 linter (source)
+        run: flake8 --ignore E12,W503 --max-line-length 120 --show-source gensim
+
+      # - name: Run flake8 linter (documentation)
+      #   run: flake8 --ignore E202,E402,E302,E305,F821 --max-line-length 120 --filename '*.py,*.rst' docs
+
+  docs:
+    name: build documentation
+    timeout-minutes: 10
+    runs-on: ubuntu-20.04
+    defaults:
+      run:
+        shell: bash
+
+    #
+    # Don't run this job unless the linters have succeeded.
+    # It's wasteful to test code that failed to lint, because it'll get
+    # re-tested once the lint errors are fixed.
+    #
+    needs: [linters]
+
+    steps:
+      - uses: actions/checkout@v2
+      - name: Set up Python ${{ matrix.python }}
+        uses: actions/setup-python@v2
+        with:
+          #
+          # We use Py3.8 here for historical reasons.
+          #
+          python-version: "3.8"
+
+      - name: Update pip
+        run: python -m pip install -U pip
+
+      - name: Install apt packages for LaTeX rendering
+        run: |
+          sudo apt-get -yq update
+          sudo apt-get -yq remove texlive-binaries --purge
+          sudo apt-get -yq --no-install-suggests --no-install-recommends --force-yes install dvipng texlive-latex-base texlive-latex-extra texlive-latex-recommended texlive-latex-extra texlive-fonts-recommended latexmk
+          sudo apt-get -yq install build-essential python3.8-dev
+
+      - name: Install gensim and its dependencies
+        run: pip install -e .[docs]
+
+      - name: Build documentation
+        run: |
+          python setup.py build_ext --inplace
+          make -C docs/src clean html
+
+      #
+      # FIXME: do we want to store the built documentation somewhere, or is
+      # knowing that the docs built successfully enough?
+      #
+
   tests:
-    name: ${{ matrix.name }}
+    name: test ${{ matrix.os }} python ${{ matrix.python }}
+    timeout-minutes: 30
     runs-on: ${{ matrix.os }}
     defaults:
       run:
@@ -16,17 +87,22 @@ jobs:
       fail-fast: false
       matrix:
         include:
-          - {name: Linux, python: 3.7, os: ubuntu-20.04, tox: 'flake8,flake8-docs'}
-          - {name: Linux, python: 3.7, os: ubuntu-20.04, tox: 'py37-linux'}
-          - {name: Linux, python: 3.8, os: ubuntu-20.04, tox: 'py38-linux-cov'}
-          - {name: Linux, python: 3.9, os: ubuntu-20.04, tox: 'py39-linux'}
-          - {name: Linux, python: '3.10', os: ubuntu-20.04, tox: 'py310-linux'}
-          - {name: Windows, python: 3.7, os: windows-2019, tox: 'py37-win'}
-          - {name: Windows, python: 3.8, os: windows-2019, tox: 'py38-win'}
-          - {name: Windows, python: 3.9, os: windows-2019, tox: 'py39-win'}
-          - {name: Windows, python: '3.10', os: windows-2019, tox: 'py310-win'}
-    env:
-      TOX_PARALLEL_NO_SPINNER: 1
+          - {python: 3.7, os: ubuntu-20.04}
+          - {python: 3.8, os: ubuntu-20.04}
+          - {python: 3.9, os: ubuntu-20.04}
+          - {python: '3.10', os: ubuntu-20.04, coverage: true}
+
+          - {python: 3.7, os: windows-2019}
+          - {python: 3.8, os: windows-2019}
+          - {python: 3.9, os: windows-2019}
+          - {python: '3.10', os: windows-2019}
+
+    #
+    # Don't run this job unless the linters have succeeded.
+    # It's wasteful to test code that failed to lint, because it'll get
+    # re-tested once the lint errors are fixed.
+    #
+    needs: [linters]
 
     steps:
      - uses: actions/checkout@v2
@@ -50,25 +126,48 @@
           curl -sL "https://keyserver.ubuntu.com/pks/lookup?op=get&search=0x2EE0EA64E40A89B84B2DF73499E82A75642AC823" | sudo apt-key add
           sudo apt-get update -y
           sudo apt-get install -y sbt
-      - name: Install tox
-        run: pip install tox
+
       - name: Install GDB & enable core dumps
         if: matrix.os == 'ubuntu-20.04'
         run: |
           sudo apt-get update -y
           sudo apt-get install -y gdb
           ulimit -c unlimited -S  # enable core dumps
-      - name: Run tox tests
-        run: tox -e ${{ matrix.tox }}
+
+      - name: Install gensim and its dependencies
+        if: matrix.os != 'windows-2019'
+        run: pip install -e .[test]
+
+      - name: Install gensim and its dependencies (Windows)
+        if: matrix.os == 'windows-2019'
+        run: pip install -e .[test-win]
+
+      - name: Build
+        run: |
+          python --version
+          pip --version
+          python setup.py build_ext --inplace
+
+      #
+      # Some of our tests are hanging.
+      # Limit the use of the coverage plugin for pytest to rule it out as a factor.
+      #
+      - name: Run tests (without coverage)
+        if: matrix.coverage != true
+        run: pytest -v gensim/test
+
+      - name: Run tests (with coverage)
+        if: matrix.coverage == true
+        run: pytest -v gensim/test --cov=gensim/ --cov-report=xml
+
       - name: Upload coverage to Codecov
-        if: matrix.os == 'ubuntu-20.04' && matrix.python == '3.8'
+        if: matrix.coverage == true
         uses: codecov/codecov-action@v2
         with:
           fail_ci_if_error: true
           files: ./coverage.xml
           verbose: true
-
       - name: Collect corefile
         if: ${{ failure() }} && matrix.os == 'ubuntu-20.04'
         run: |
diff --git a/gensim/models/fasttext.py b/gensim/models/fasttext.py
index 6d992d9b94..5ea5077a0c 100644
--- a/gensim/models/fasttext.py
+++ b/gensim/models/fasttext.py
@@ -1045,7 +1045,7 @@ def __contains__(self, word):
 
         Note
         ----
-        This method **always** returns True, because of the way FastText works.
+        This method **always** returns True with char ngrams, because of the way FastText works.
 
         If you want to check if a word is an in-vocabulary term, use this instead:
 
@@ -1059,7 +1059,10 @@ def __contains__(self, word):
             False
 
         """
-        return True
+        if self.bucket == 0:  # check for the case when char ngrams are not used
+            return word in self.key_to_index
+        else:
+            return True
 
     def save(self, *args, **kwargs):
         """Save object.
@@ -1131,6 +1134,23 @@ def get_vector(self, word, norm=False):
         else:
             return word_vec / len(ngram_hashes)
 
+    def get_sentence_vector(self, sentence):
+        """Get a single 1-D vector representation for a given `sentence`.
+        This method works like the official fastText's get_sentence_vector().
+
+        Parameters
+        ----------
+        sentence : list of (str or int)
+            List of words specified by string or int ids.
+
+        Returns
+        -------
+        numpy.ndarray
+            1-D numpy array representation of the `sentence`.
+
+        """
+        return super(FastTextKeyedVectors, self).get_mean_vector(sentence)
+
     def resize_vectors(self, seed=0):
         """Make underlying vectors match 'index_to_key' size; random-initialize any new rows."""
 
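For a sense of how the two fasttext.py changes above interact, here is a rough usage sketch; the toy model and the corpus (gensim's bundled common_texts) are illustrative, not part of the patch:

    >>> from gensim.models import FastText
    >>> from gensim.test.utils import common_texts
    >>>
    >>> # with bucket=0 there are no char-ngram buckets, so `in` becomes a real vocabulary check
    >>> model = FastText(sentences=common_texts, vector_size=10, min_count=1, bucket=0)
    >>> 'human' in model.wv       # in-vocabulary word
    True
    >>> 'zombie' in model.wv      # OOV word; False only because bucket == 0
    False
    >>>
    >>> # get_sentence_vector() delegates to the new KeyedVectors.get_mean_vector()
    >>> model.wv.get_sentence_vector(['human', 'interface']).shape
    (10,)
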
diff --git a/gensim/models/keyedvectors.py b/gensim/models/keyedvectors.py
index f56adb0b14..0dd043c2df 100644
--- a/gensim/models/keyedvectors.py
+++ b/gensim/models/keyedvectors.py
@@ -174,8 +174,8 @@ from typing import Iterable
 
 from numpy import (
-    dot, float32 as REAL, double, array, zeros, vstack,
-    ndarray, sum as np_sum, prod, argmax, dtype, ascontiguousarray, frombuffer,
+    dot, float32 as REAL, double, zeros, vstack, ndarray,
+    sum as np_sum, prod, argmax, dtype, ascontiguousarray, frombuffer,
 )
 import numpy as np
 from scipy import stats
@@ -203,6 +203,9 @@ def _ensure_list(value):
     if isinstance(value, _KEY_TYPES) or (isinstance(value, ndarray) and len(value.shape) == 1):
         return [value]
 
+    if isinstance(value, ndarray) and len(value.shape) == 2:
+        return list(value)
+
     return value
 
@@ -274,6 +277,9 @@ def _load_specials(self, *args, **kwargs):
         # fixup rename of vocab into map
         if 'key_to_index' not in self.__dict__:
             self._upconvert_old_vocab()
+        # ensure older instances have next_index
+        if not hasattr(self, 'next_index'):
+            self.next_index = len(self)
 
     def _upconvert_old_vocab(self):
         """Convert a loaded, pre-gensim-4.0.0 version instance that had a 'vocab' dict of data objects."""
@@ -450,6 +456,71 @@ def word_vec(self, *args, **kwargs):
         """Compatibility alias for get_vector(); must exist so subclass calls reach subclass get_vector()."""
         return self.get_vector(*args, **kwargs)
 
+    def get_mean_vector(self, keys, weights=None, pre_normalize=True, post_normalize=False, ignore_missing=True):
+        """Get the mean vector for a given list of keys.
+
+        Parameters
+        ----------
+        keys : list of (str or int or ndarray)
+            Keys specified by string or int ids, or by numpy array.
+        weights : list of float or numpy.ndarray, optional
+            1-D array of the same size as `keys`, specifying the weight for each key.
+        pre_normalize : bool, optional
+            Flag indicating whether to normalize each key vector before taking the mean.
+            If False, individual key vectors are not normalized.
+        post_normalize : bool, optional
+            Flag indicating whether to normalize the final mean vector.
+            If True, the returned mean vector is normalized.
+        ignore_missing : bool, optional
+            If False, raise a KeyError if any key is missing from the vocabulary.
+
+        Returns
+        -------
+        numpy.ndarray
+            Mean vector for the list of keys.
+
+        Raises
+        ------
+        ValueError
+            If the sizes of `keys` and `weights` don't match.
+        KeyError
+            If any of the keys is missing from the vocabulary and `ignore_missing` is False.
+
+        """
+        if len(keys) == 0:
+            raise ValueError("cannot compute mean with no input")
+        if isinstance(weights, list):
+            weights = np.array(weights)
+        if weights is None:
+            weights = np.ones(len(keys))
+        if len(keys) != weights.shape[0]:  # weights is a 1-D numpy array
+            raise ValueError(
+                "keys and weights array must have same number of elements"
+            )
+
+        mean = np.zeros(self.vector_size, self.vectors.dtype)
+
+        total_weight = 0
+        for idx, key in enumerate(keys):
+            if isinstance(key, ndarray):
+                mean += weights[idx] * key
+                total_weight += abs(weights[idx])
+            elif self.__contains__(key):
+                vec = self.get_vector(key, norm=pre_normalize)
+                mean += weights[idx] * vec
+                total_weight += abs(weights[idx])
+            elif not ignore_missing:
+                raise KeyError(f"Key '{key}' not present in vocabulary")
+
+        if total_weight > 0:
+            mean = mean / total_weight
+        if post_normalize:
+            mean = matutils.unitvec(mean).astype(REAL)
+        return mean
+
     def add_vector(self, key, vector):
         """Add one new vector at the given key, into existing slot if available.
 
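A quick usage sketch for the new method; `wv` stands for any loaded KeyedVectors instance, and the keys and weights here are made up:

    >>> import numpy as np
    >>> # unweighted mean of pre-normalized vectors; OOV keys are silently skipped by default
    >>> mean = wv.get_mean_vector(['king', 'queen', 'some-oov-token'])
    >>> # weighted mean of raw vectors, scaled to unit length on the way out
    >>> mean = wv.get_mean_vector(['king', 'queen'], weights=[0.8, 0.2],
    ...                           pre_normalize=False, post_normalize=True)
    >>> round(float(np.linalg.norm(mean)), 3)
    1.0
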
@@ -714,10 +785,10 @@
 
         Parameters
         ----------
-        positive : list of (str or int or ndarray), optional
-            List of keys that contribute positively.
-        negative : list of (str or int or ndarray), optional
-            List of keys that contribute negatively.
+        positive : list of (str or int or ndarray) or list of ((str, float) or (int, float) or (ndarray, float)), optional
+            List of keys that contribute positively. If a tuple, the second element specifies the weight (default `1.0`).
+        negative : list of (str or int or ndarray) or list of ((str, float) or (int, float) or (ndarray, float)), optional
+            List of keys that contribute negatively. If a tuple, the second element specifies the weight (default `-1.0`).
         topn : int or None, optional
             Number of top-N similar keys to return, when `topn` is int. When `topn` is None,
             then similarities for all keys are returned.
@@ -755,27 +826,20 @@
             clip_end = restrict_vocab
 
         # add weights for each key, if not already present; default to 1.0 for positive and -1.0 for negative keys
-        positive = [
-            (item, 1.0) if isinstance(item, _EXTENDED_KEY_TYPES) else item
-            for item in positive
-        ]
-        negative = [
-            (item, -1.0) if isinstance(item, _EXTENDED_KEY_TYPES) else item
-            for item in negative
-        ]
+        keys = []
+        weight = np.concatenate((np.ones(len(positive)), -1.0 * np.ones(len(negative))))
+        for idx, item in enumerate(positive + negative):
+            if isinstance(item, _EXTENDED_KEY_TYPES):
+                keys.append(item)
+            else:
+                keys.append(item[0])
+                weight[idx] = item[1]
 
         # compute the weighted average of all keys
-        all_keys, mean = set(), []
-        for key, weight in positive + negative:
-            if isinstance(key, ndarray):
-                mean.append(weight * key)
-            else:
-                mean.append(weight * self.get_vector(key, norm=True))
-                if self.has_index_for(key):
-                    all_keys.add(self.get_index(key))
-        if not mean:
-            raise ValueError("cannot compute similarity with no input")
-        mean = matutils.unitvec(array(mean).mean(axis=0)).astype(REAL)
+        mean = self.get_mean_vector(keys, weight, pre_normalize=True, post_normalize=True, ignore_missing=False)
+        all_keys = [
+            self.get_index(key) for key in keys if isinstance(key, _KEY_TYPES) and self.has_index_for(key)
+        ]
 
         if indexer is not None and isinstance(topn, int):
             return indexer.most_similar(mean, topn)
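The (key, weight) tuple syntax keeps plain calls working unchanged while allowing non-uniform weights; a sketch, again with a hypothetical loaded `wv`:

    >>> # classic analogy query; implicit weights of +1.0 and -1.0
    >>> result = wv.most_similar(positive=['king', 'woman'], negative=['man'], topn=3)
    >>> # same query with explicit per-key weights; note that a tuple in `negative`
    >>> # overrides the default -1.0, so the weight itself must be negative
    >>> result = wv.most_similar(positive=[('king', 1.0), ('woman', 0.5)], negative=[('man', -0.5)], topn=3)
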
@@ -943,7 +1007,9 @@ def nbow(document):
         # Compute WMD.
         return emd(d1, d2, distance_matrix)
 
-    def most_similar_cosmul(self, positive=None, negative=None, topn=10):
+    def most_similar_cosmul(
+        self, positive=None, negative=None, topn=10, restrict_vocab=None
+    ):
         """Find the top-N most similar words, using the multiplicative combination objective,
         proposed by `Omer Levy and Yoav Goldberg "Linguistic Regularities in Sparse and Explicit Word Representations"
         `_. Positive words still contribute positively towards the similarity,
@@ -956,6 +1022,9 @@ def most_similar_cosmul(
         With a single positive example, rankings will be the same as in the default
         :meth:`~gensim.models.keyedvectors.KeyedVectors.most_similar`.
 
+        Allows calls like most_similar_cosmul('dog', 'cat'), as a shorthand for
+        most_similar_cosmul(['dog'], ['cat']), where 'dog' is positive and 'cat' is negative.
+
         Parameters
         ----------
         positive : list of str, optional
@@ -965,6 +1034,11 @@ def most_similar_cosmul(
         topn : int or None, optional
             Number of top-N similar words to return, when `topn` is int. When `topn` is None,
             then similarities for all words are returned.
+        restrict_vocab : int or None, optional
+            Optional integer which limits the range of vectors which are searched for most-similar values.
+            For example, restrict_vocab=10000 would only check the first 10000 word vectors in the vocabulary order.
+            This may be meaningful if the vocabulary is sorted by descending frequency.
 
         Returns
         -------
@@ -982,7 +1056,14 @@ def most_similar_cosmul(
         positive = _ensure_list(positive)
         negative = _ensure_list(negative)
 
-        self.fill_norms()
+        self.init_sims()
+
+        if isinstance(positive, str):
+            # allow calls like most_similar_cosmul('dog'), as a shorthand for most_similar_cosmul(['dog'])
+            positive = [positive]
+
+        if isinstance(negative, str):
+            negative = [negative]
 
         all_words = {
             self.get_index(word) for word in positive + negative
@@ -1039,7 +1120,7 @@ def rank_by_centrality(self, words, use_norm=True):
         if not used_words:
             raise ValueError("cannot select a word from an empty list")
         vectors = vstack([self.get_vector(word, norm=use_norm) for word in used_words]).astype(REAL)
-        mean = matutils.unitvec(vectors.mean(axis=0)).astype(REAL)
+        mean = self.get_mean_vector(vectors, post_normalize=True)
         dists = dot(vectors, mean)
         return sorted(zip(dists, used_words), reverse=True)
 
@@ -1171,9 +1252,9 @@ def n_similarity(self, ws1, ws2):
         """
         if not(len(ws1) and len(ws2)):
             raise ZeroDivisionError('At least one of the passed list is empty.')
-        v1 = [self[key] for key in ws1]
-        v2 = [self[key] for key in ws2]
-        return dot(matutils.unitvec(array(v1).mean(axis=0)), matutils.unitvec(array(v2).mean(axis=0)))
+        mean1 = self.get_mean_vector(ws1, pre_normalize=False)
+        mean2 = self.get_mean_vector(ws2, pre_normalize=False)
+        return dot(matutils.unitvec(mean1), matutils.unitvec(mean2))
 
     @staticmethod
     def _log_evaluate_word_analogies(section):
@@ -1202,7 +1283,9 @@ def _log_evaluate_word_analogies(section):
         logger.info("%s: %.1f%% (%i/%i)", section['section'], 100.0 * score, correct, correct + incorrect)
         return score
 
-    def evaluate_word_analogies(self, analogies, restrict_vocab=300000, case_insensitive=True, dummy4unknown=False):
+    def evaluate_word_analogies(
+            self, analogies, restrict_vocab=300000, case_insensitive=True,
+            dummy4unknown=False, similarity_function='most_similar'):
         """Compute performance of the model on an analogy test set.
 
         The accuracy is reported (printed to log and returned as a score) for each section separately,
@@ -1228,6 +1311,8 @@
         dummy4unknown : bool, optional
             If True - produce zero accuracies for 4-tuples with out-of-vocabulary words.
             Otherwise, these tuples are skipped entirely and not used in the evaluation.
+        similarity_function : str, optional
+            Name of the function to use for the similarity calculation (e.g. 'most_similar' or 'most_similar_cosmul').
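And a sketch of the new positional shorthand (hypothetical `wv`):

    >>> # first positional argument is treated as positive, the second as negative...
    >>> result = wv.most_similar_cosmul('dog', 'cat', topn=5)
    >>> # ...equivalent to the explicit form
    >>> result = wv.most_similar_cosmul(positive=['dog'], negative=['cat'], topn=5)
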
 
         Returns
         -------
@@ -1283,6 +1368,7 @@
             predicted = None
             # find the most likely prediction using 3CosAdd (vector offset) method
             # TODO: implement 3CosMul and set-based methods for solving analogies
+
             sims = self.most_similar(positive=[b, c], negative=[a], topn=5, restrict_vocab=restrict_vocab)
             self.key_to_index = original_key_to_index
         for element in sims:
diff --git a/gensim/models/lsimodel.py b/gensim/models/lsimodel.py
index 6a407e860e..8f8c9c511a 100644
--- a/gensim/models/lsimodel.py
+++ b/gensim/models/lsimodel.py
@@ -70,6 +70,7 @@
 
 from gensim import interfaces, matutils, utils
 from gensim.models import basemodel
+from gensim.utils import is_empty
 
 logger = logging.getLogger(__name__)
 
@@ -489,7 +490,8 @@ def add_documents(self, corpus, chunksize=None, decay=None):
             chunksize = self.chunksize
         if decay is None:
             decay = self.decay
-
+        if is_empty(corpus):
+            logger.warning('LsiModel.add_documents() called but no documents provided, is this intended?')
         if not scipy.sparse.issparse(corpus):
             if not self.onepass:
                 # we are allowed multiple passes over the input => use a faster, randomized two-pass algo
@@ -590,7 +592,8 @@ def __getitem__(self, bow, scaled=False, chunksize=512):
             Latent representation of corpus in BoW format if `bow` is corpus.
 
         """
-        assert self.projection.u is not None, "decomposition not initialized yet"
+        if self.projection.u is None:
+            raise ValueError('No training data provided - LSI model not initialized yet')
 
         # if the input vector is in fact a corpus, return a transformed corpus as a result
         is_corpus, bow = utils.is_corpus(bow)
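Together with the is_empty() helper added to gensim/utils.py below, this replaces two silent failure modes with explicit signals; a sketch on a toy setup, with illustrative names:

    >>> from gensim.models import LsiModel
    >>> from gensim.test.utils import common_dictionary
    >>>
    >>> lsi = LsiModel(id2word=common_dictionary, num_topics=2)  # no training data yet
    >>> lsi.add_documents([])  # logs the new "no documents provided" warning
    >>> lsi[[(0, 1.0)]]
    Traceback (most recent call last):
      ...
    ValueError: No training data provided - LSI model not initialized yet
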
diff --git a/gensim/test/test_fasttext.py b/gensim/test/test_fasttext.py
index 8922ee0ac9..ecc44a30e4 100644
--- a/gensim/test/test_fasttext.py
+++ b/gensim/test/test_fasttext.py
@@ -45,8 +45,7 @@
 BUCKET = 10000
 
 FT_HOME = os.environ.get("FT_HOME")
-FT_CMD = shutil.which("fasttext", path=FT_HOME) or \
-    shutil.which("fasttext")
+FT_CMD = shutil.which("fasttext", path=FT_HOME) or shutil.which("fasttext")
 
 new_sentences = [
@@ -374,6 +373,9 @@ def test_most_similar_cosmul(self):
         self.assertEqual(
             self.test_model.wv.most_similar_cosmul('nights'),
             self.test_model.wv.most_similar_cosmul(positive=['nights']))
+        self.assertEqual(
+            self.test_model.wv.most_similar_cosmul('the', 'and'),
+            self.test_model.wv.most_similar_cosmul(positive=['the'], negative=['and']))
 
     def test_lookup(self):
         # In vocab, sanity check
diff --git a/gensim/test/test_keyedvectors.py b/gensim/test/test_keyedvectors.py
index d5eda547ea..cc70577842 100644
--- a/gensim/test/test_keyedvectors.py
+++ b/gensim/test/test_keyedvectors.py
@@ -366,6 +366,35 @@ def test_no_header(self):
         self.assertEqual(randkv.index_to_key, reloadtxtkv.index_to_key)
         self.assertTrue((randkv.vectors == reloadtxtkv.vectors).all())
 
+    def test_get_mean_vector(self):
+        """Test get_mean_vector returns expected results."""
+        keys = [
+            'conflict',
+            'administration',
+            'terrorism',
+            'call',
+            'an out-of-vocabulary word',
+        ]
+        weights = [1, 2, 3, 1, 2]
+        expected_result_1 = np.array([
+            0.02000151, -0.12685453, 0.09196121, 0.25514853, 0.25740655,
+            -0.11134843, -0.0502661, -0.19278568, -0.83346179, -0.12068878,
+        ], dtype=np.float32)
+        expected_result_2 = np.array([
+            -0.0145228, -0.11530358, 0.1169825, 0.22537769, 0.29353586,
+            -0.10458107, -0.05272481, -0.17547795, -0.84245106, -0.10356515,
+        ], dtype=np.float32)
+        expected_result_3 = np.array([
+            0.01343237, -0.47651053, 0.45645328, 0.98304356, 1.1840123,
+            -0.51647933, -0.25308795, -0.77931081, -3.55954733, -0.55429711,
+        ], dtype=np.float32)
+
+        self.assertTrue(np.allclose(self.vectors.get_mean_vector(keys), expected_result_1))
+        self.assertTrue(np.allclose(self.vectors.get_mean_vector(keys, weights), expected_result_2))
+        self.assertTrue(np.allclose(
+            self.vectors.get_mean_vector(keys, pre_normalize=False), expected_result_3)
+        )
+
 
 class Gensim320Test(unittest.TestCase):
     def test(self):
diff --git a/gensim/test/test_translation_matrix.py b/gensim/test/test_translation_matrix.py
index c725fc0139..44ed22855e 100644
--- a/gensim/test/test_translation_matrix.py
+++ b/gensim/test/test_translation_matrix.py
@@ -1,6 +1,5 @@
 #!/usr/bin/env python
 # encoding: utf-8
-import sys
 from collections import namedtuple
 import unittest
 import logging
@@ -63,7 +62,7 @@ def test_translate_nn(self):
             self.assertTrue(item[1] in translated_words[item[0]])
 
     @pytest.mark.xfail(
-        sys.platform == 'darwin',
+        True,
         reason='blinking test, can be related to '
     )
     def test_translate_gc(self):
diff --git a/gensim/test/test_word2vec.py b/gensim/test/test_word2vec.py
index 56a1ecfae0..8edfe3c04c 100644
--- a/gensim/test/test_word2vec.py
+++ b/gensim/test/test_word2vec.py
@@ -555,6 +555,12 @@ def test_evaluate_word_analogies(self):
         """Test that evaluating analogies on KeyedVectors give sane results"""
         model = word2vec.Word2Vec(LeeCorpus())
         score, sections = model.wv.evaluate_word_analogies(datapath('questions-words.txt'))
+        score_cosmul, sections_cosmul = model.wv.evaluate_word_analogies(
+            datapath('questions-words.txt'),
+            similarity_function='most_similar_cosmul'
+        )
+        self.assertEqual(score, score_cosmul)
+        self.assertEqual(sections, sections_cosmul)
         self.assertGreaterEqual(score, 0.0)
         self.assertLessEqual(score, 1.0)
         self.assertGreater(len(sections), 0)
diff --git a/gensim/utils.py b/gensim/utils.py
index d4fc6a71dc..78d64b88e6 100644
--- a/gensim/utils.py
+++ b/gensim/utils.py
@@ -30,6 +30,7 @@
 from copy import deepcopy
 from datetime import datetime
 import platform
+import types
 
 import numpy as np
 import scipy.sparse
@@ -2084,3 +2085,19 @@ def effective_n_jobs(n_jobs):
     elif n_jobs < 0:
         n_jobs = max(multiprocessing.cpu_count() + 1 + n_jobs, 1)
     return n_jobs
+
+
+def is_empty(corpus):
+    """Is the corpus (an iterable or a scipy.sparse array) empty?"""
+    if scipy.sparse.issparse(corpus):
+        return corpus.shape[1] == 0  # by convention, scipy.sparse documents are columns
+    if isinstance(corpus, types.GeneratorType):
+        return False  # don't try to guess emptiness of generators, may lose elements irretrievably
+    try:
+        # list, numpy array, etc.
+        first_doc = next(iter(corpus))  # noqa: F841 (ignore unused variable)
+        return False  # first document exists => not empty
+    except StopIteration:
+        return True
+    except Exception:
+        return False
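A quick sketch of how the helper treats each corpus type:

    >>> from gensim.utils import is_empty
    >>> import scipy.sparse
    >>>
    >>> is_empty([])                               # no documents
    True
    >>> is_empty([[(0, 1.0)]])                     # one BoW document
    False
    >>> is_empty(scipy.sparse.csr_matrix((5, 0)))  # sparse documents are columns
    True
    >>> is_empty(doc for doc in [])                # generators are never consumed, hence never "empty"
    False
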
diff --git a/tox.ini b/tox.ini
deleted file mode 100644
index 566e331997..0000000000
--- a/tox.ini
+++ /dev/null
@@ -1,154 +0,0 @@
-[tox]
-minversion = 2.0
-envlist = {py37,py38,py39,py310}-{win,linux}, py38-linux-cov, flake8, docs, docs-upload, download-wheels, upload-wheels, test-pypi
-skipsdist = True
-platform = linux: linux
-           win: win64
-
-
-[flake8]
-ignore = E12, W503
-max-line-length = 120
-show-source = True
-
-
-[flake8-rst]
-filename = *.rst *.py
-max-line-length = 120
-ignore = E203,  # space before :
-    E402,  # module level import not at top of file
-    # Classes / functions in a docstring block generate those errors
-    E302,  # expected 2 blank lines, found 0
-    E305,  # expected 2 blank lines after class or function definition, found 0
-    F821,  # undefined name; remove once all docstrings are fully executable
-exclude = .venv, .git, .tox, dist, doc, build, gensim/models/deprecated
-
-
-[coverage:run]
-source=gensim
-
-[coverage:report]
-omit =
-    gensim/test/*
-    */__init__.py
-
-exclude_lines =
-    pragma: no cover
-    def __repr__
-    def __str__
-    raise AssertionError
-    raise NotImplementedError
-    if __name__ == .__main__.:
-
-ignore_errors = True
-
-#
-# Conditional factors https://tox.wiki/en/latest/config.html#factors
-#
-[pytest]
-addopts = -rfxEXs --durations=20 --showlocals
-
-[testenv]
-recreate = True
-
-install_command = python -m pip install --timeout=60 {env:TOX_PIP_OPTS:} {opts} {packages}
-
-deps =
-    pip>=19.1.1
-    linux: .[test]
-    win: .[test-win]
-
-setenv =
-    FT_HOME={env:FT_HOME:}
-    WR_HOME={env:WR_HOME:}
-    VOWPAL_WABBIT_PATH={env:VOWPAL_WABBIT_PATH:}
-    DTM_PATH={env:DTM_PATH:}
-    MALLET_HOME={env:MALLET_HOME:}
-    SKIP_NETWORK_TESTS={env:SKIP_NETWORK_TESTS:}
-    BOTO_CONFIG={env:BOTO_CONFIG:}
-    RUNNER_OS={env:RUNNER_OS:}
-    PYTHONHASHSEED=1
-    TOX_PARALLEL_NO_SPINNER=1
-
-commands =
-    python --version
-    pip --version
-    python setup.py build_ext --inplace
-    cov: pytest {posargs:gensim/test} --cov=gensim/ --cov-report=xml
-    !cov: pytest {posargs:gensim/test}
-
-
-[testenv:flake8]
-recreate = True
-deps =
-    # Pinned to 3.7.9 because >3.8.0 triggers "AttributeError: 'Namespace' object has no attribute 'output_file'"
-    # in flake8-rst. Apparently some bug in flake8-rst:
-    # https://gitlab.com/pycqa/flake8/-/issues/641
-    # https://github.com/kataev/flake8-rst/pull/23/files
-    flake8==3.7.9
-
-commands = flake8 gensim/ {posargs}
-
-
-[testenv:flake8-docs]
-recreate = True
-deps =
-    flake8-rst==0.7.2
-    flake8==3.7.9
-
-commands = flake8-rst gensim/ docs/ {posargs}
-
-
-[testenv:compile]
-basepython = python3
-recreate = True
-
-deps = numpy
-commands = python setup.py build_ext --inplace
-
-
-[testenv:docs]
-basepython = python3
-recreate = True
-whitelist_externals = make
-deps = .[docs]
-
-commands =
-    python setup.py build_ext --inplace
-    make -C docs/src clean html
-
-
-[testenv:docs-upload]
-recreate = True
-whitelist_externals = make
-deps = .[docs]
-changedir = docs/src
-
-commands = make clean html upload
-
-
-[testenv:download-wheels]
-deps = wheelhouse_uploader
-whitelist_externals = rm
-recreate = True
-
-commands =
-    rm -rf dist/
-    python setup.py sdist fetch_artifacts
-
-
-[testenv:upload-wheels]
-deps = twine
-
-commands = twine upload dist/*
-
-
-[testenv:test-pypi]
-deps = twine
-whitelist_externals = rm
-
-commands =
-    rm -rf dist/
-    python setup.py sdist
-    twine upload --repository-url https://test.pypi.org/legacy/ dist/*
-    ; Go to https://testpypi.python.org/pypi?name=gensim&:action=display and check result