Source code for orangecontrib.text.topics.lsi

from numpy import float64
from gensim.models import LsiModel

from .topics import GensimWrapper

class LsiModelProxy(LsiModel):
    update = LsiModel.add_documents

    def add_documents(self, corpus, chunksize=None, decay=None):
        add_documents calls update which is equal to super().add_documents

        It is made because of mechanism in which disables update in
        some cases. In case of Lsi disabling update must results in disabling
        self.update(corpus, chunksize, decay)

[docs]class LsiWrapper(GensimWrapper): name = 'Latent Semantic Indexing' Model = LsiModelProxy has_negative_weights = True
[docs] def __init__(self, **kwargs): super().__init__(**kwargs, dtype=float64, random_seed=0)