src.fairreckitlib.model.pipeline.model_pipeline

This module contains base functionality of the complete model pipeline.

Classes:

ModelPipeline: class that batches multiple model computations for a specific API.

This program has been developed by students from the bachelor Computer Science at Utrecht University within the Software Project course. © Copyright Utrecht University (Department of Information and Computing Sciences)
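The final step of the pipeline, merging the original train and test ratings back onto each computed rating file, can be sketched in isolation with plain pandas. The column names (`user`, `item`, `rating`) follow the pipeline's dataframes; the sample data and the `score` column are purely illustrative:

```python
import pandas as pd

# Hypothetical train/test splits with the pipeline's column layout.
train = pd.DataFrame({'user': [1, 1], 'item': [10, 11], 'rating': [4.0, 3.0]})
test = pd.DataFrame({'user': [2], 'item': [10], 'rating': [5.0]})

# Hypothetical computed model output: user/item pairs with a predicted score.
result = pd.DataFrame({'user': [2, 2], 'item': [10, 12], 'score': [4.5, 2.0]})

# Mirror ModelPipeline.reconstruct_ratings: concatenate the original sets
# and left-merge them onto the computed ratings on (user, item).
ratings = pd.concat([train, test])
result = pd.merge(result, ratings, how='left', on=['user', 'item'])
```

Pairs that the model produced but that never occurred in the original data keep a missing `rating` after the left merge.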

"""This module contains base functionality of the complete model pipeline.

Classes:

    ModelPipeline: class that batches multiple model computations for a specific API.

This program has been developed by students from the bachelor Computer Science at
Utrecht University within the Software Project course.
© Copyright Utrecht University (Department of Information and Computing Sciences)
"""

from abc import ABCMeta, abstractmethod
import os
import time
from typing import Any, Callable, Dict, List, Tuple

import pandas as pd

from ...core.config.config_factories import Factory
from ...core.core_constants import MODEL_RATINGS_FILE, MODEL_USER_BATCH_SIZE
from ...core.events.event_dispatcher import EventDispatcher
from ...core.events.event_error import ON_FAILURE_ERROR, ON_RAISE_ERROR, ErrorEventArgs
from ...core.io.event_io import DataframeEventArgs, FileEventArgs
from ...core.io.io_create import create_dir, create_json
from ...core.io.io_delete import delete_dir
from ...core.pipeline.core_pipeline import CorePipeline
from ...data.data_transition import DataTransition
from ..algorithms.base_algorithm import BaseAlgorithm
from ..algorithms.matrix import Matrix
from .model_config import ModelConfig
from .model_event import ON_BEGIN_LOAD_TEST_SET, ON_END_LOAD_TEST_SET
from .model_event import ON_BEGIN_LOAD_TRAIN_SET, ON_END_LOAD_TRAIN_SET
from .model_event import ON_BEGIN_MODEL_PIPELINE, ON_END_MODEL_PIPELINE
from .model_event import ON_BEGIN_RECONSTRUCT_RATINGS, ON_END_RECONSTRUCT_RATINGS
from .model_event import ON_BEGIN_TEST_MODEL, ON_END_TEST_MODEL
from .model_event import ON_BEGIN_TRAIN_MODEL, ON_END_TRAIN_MODEL
from .model_event import ON_BEGIN_MODEL, ON_END_MODEL
from .model_event import ModelPipelineEventArgs, ModelEventArgs


class ModelPipeline(CorePipeline, metaclass=ABCMeta):
    """Model Pipeline to run computations for algorithms from a specific API.

    Wraps the common functionality that applies to all models, regardless of their type.
    Loading the train and test set is only done once each time the pipeline is run.
    After these sets are done loading, the pipeline loops
    through all specified models and executes the following steps:

    1) create the output directory.
    2) create the model.
    3) save the model's creation settings.
    4) train the model using the train set.
    5) test the model using the test set.

    After all models are trained and tested, the computed rating files are updated
    with the original ratings from the train and test set.

    Abstract methods:

    load_test_set_users
    test_model_ratings

    Public methods:

    run
    """

    def __init__(
            self,
            algo_factory: Factory,
            data_transition: DataTransition,
            event_dispatcher: EventDispatcher):
        """Construct the model pipeline.

        Args:
            algo_factory: factory of available algorithms for this API.
            data_transition: data input.
            event_dispatcher: used to dispatch model/IO events when running the pipeline.
        """
        CorePipeline.__init__(self, event_dispatcher)
        self.algo_factory = algo_factory
        self.data_transition = data_transition
        self.tested_models = {}

        self.train_set_matrix = None
        self.test_set_users = None

    def run(self,
            output_dir: str,
            models_config: List[ModelConfig],
            is_running: Callable[[], bool],
            **kwargs) -> List[str]:
        """Run the entire pipeline from beginning to end.

        Effectively runs all computations of the specified models.

        Args:
            output_dir: the path of the directory to store the output.
            models_config: list of ModelConfig objects to compute.
            is_running: function that returns whether the pipeline
                is still running. Stops early when False is returned.

        Keyword Args:
            num_threads(int): the max number of threads an algorithm can use.
            num_items(int): the number of item recommendations to produce, only
                needed when running the pipeline for recommender algorithms.
            rated_items_filter(bool): whether to filter already rated items when
                producing item recommendations.

        Raises:
            FileNotFoundError: when the train and/or test set fails to load.

        Returns:
            a list of model directories where computation results are stored.
        """
        result_dirs = []
        if not is_running():
            return result_dirs

        self.event_dispatcher.dispatch(ModelPipelineEventArgs(
            ON_BEGIN_MODEL_PIPELINE,
            self.algo_factory.get_name(),
            models_config
        ))

        start = time.time()

        # this can raise a FileNotFoundError, effectively aborting the pipeline
        self.load_train_set_matrix()
        if not is_running():
            return result_dirs

        # this can raise a FileNotFoundError, effectively aborting the pipeline
        self.load_test_set_users()
        if not is_running():
            return result_dirs

        for model in models_config:
            # verify that the specified model is available
            if not self.algo_factory.is_obj_available(model.name):
                self.event_dispatcher.dispatch(ErrorEventArgs(
                    ON_FAILURE_ERROR,
                    'Failure: algorithm is not available: ' +
                    self.algo_factory.get_name() + ' ' + model.name
                ))
                continue

            # create model output dir
            model_dir = self.create_model_output_dir(
                output_dir,
                model.name
            )

            # attempt to run the model computation, discarding the
            # output directory of any model run that raises an error
            try:
                self.run_model(
                    model_dir,
                    model,
                    is_running,
                    **kwargs
                )
            except (ArithmeticError, MemoryError, RuntimeError) as err:
                self.event_dispatcher.dispatch(ErrorEventArgs(
                    ON_RAISE_ERROR,
                    type(err).__name__ + ': trying to run model ' +
                    self.algo_factory.get_name() + ' ' + model.name
                ))
                delete_dir(model_dir, self.event_dispatcher)
                continue

            result_dirs.append(model_dir)
            if not is_running():
                return result_dirs

        # free up some memory because everything is trained and tested
        self.train_set_matrix = None
        self.test_set_users = None

        self.reconstruct_ratings(result_dirs, is_running)

        end = time.time()

        self.event_dispatcher.dispatch(ModelPipelineEventArgs(
            ON_END_MODEL_PIPELINE,
            self.algo_factory.get_name(),
            models_config
        ), elapsed_time=end - start)

        return result_dirs

    def run_model(
            self,
            model_dir: str,
            model_config: ModelConfig,
            is_running: Callable[[], bool],
            **kwargs) -> None:
        """Run the model computation for the specified model configuration.

        Args:
            model_dir: the path of the directory where the computed ratings can be stored.
            model_config: the algorithm model configuration.
            is_running: function that returns whether the pipeline
                is still running. Stops early when False is returned.

        Keyword Args:
            num_threads(int): the max number of threads an algorithm can use.
            num_items(int): the number of item recommendations to produce, only
                needed when running the pipeline for recommender algorithms.
            rated_items_filter(bool): whether to filter already rated items when
                producing item recommendations.

        Raises:
            ArithmeticError: possibly raised by a model on construction, training or testing.
            MemoryError: possibly raised by a model on construction, training or testing.
            RuntimeError: possibly raised by a model on construction, training or testing.
        """
        model, start = self.begin_model(
            model_config.name,
            model_config.params,
            model_dir,
            **kwargs
        )
        if not is_running():
            return

        self.train_and_test_model(model, model_dir, is_running, **kwargs)
        if not is_running():
            return

        self.end_model(model, start)

    def begin_model(
            self,
            model_name: str,
            model_params: Dict[str, Any],
            model_dir: str,
            **kwargs) -> Tuple[BaseAlgorithm, float]:
        """Prepare the model computation.

        Creates the model according to the specified name and parameters,
        and saves the model's creation settings in the model directory.

        Args:
            model_name: name of the model's algorithm.
            model_params: parameters of the algorithm.
            model_dir: the path of the directory where the computed ratings can be stored.

        Keyword Args:
            num_threads(int): the max number of threads an algorithm can use.
            rated_items_filter(bool): whether to filter already rated items when
                producing item recommendations.

        Raises:
            ArithmeticError: possibly raised by a model on construction.
            MemoryError: possibly raised by a model on construction.
            RuntimeError: possibly raised by a model on construction.

        Returns:
            model: the created model according to the specified name and parameters.
            start: the time when the model computation started.
        """
        start = time.time()

        self.event_dispatcher.dispatch(ModelEventArgs(
            ON_BEGIN_MODEL,
            model_name,
            model_params
        ))

        # attempt to create model
        kwargs['rating_type'] = self.data_transition.get_rating_type()
        model = self.algo_factory.create(
            model_name,
            model_params,
            **kwargs
        )

        # create settings file
        create_json(
            os.path.join(model_dir, 'settings.json'),
            model.get_params(),
            self.event_dispatcher,
            indent=4
        )

        return model, start

    def create_model_output_dir(self, output_dir: str, model_name: str) -> str:
        """Create the output directory for a model.

        Args:
            output_dir: the path of the directory to store the output.
            model_name: name of the model's algorithm.

        Returns:
            the path of the directory where the model's computed ratings can be stored.
        """
        if self.tested_models.get(model_name) is None:
            # initialize model name counter
            self.tested_models[model_name] = 0

        return create_dir(self.get_model_output_dir(output_dir, model_name), self.event_dispatcher)

    def get_model_output_dir(self, output_dir: str, model_name: str) -> str:
        """Get the model output directory path for the specified model name.

        Args:
            output_dir: the path of the directory to store the output.
            model_name: name of the model's algorithm.

        Returns:
            the path of the directory where the model's computed ratings can be stored.
        """
        index = self.tested_models[model_name]
        return os.path.join(
            output_dir,
            self.algo_factory.get_name() + '_' + model_name + '_' + str(index)
        )

    def end_model(self, model: BaseAlgorithm, start: float) -> None:
        """Finalize the model computation.

        Updates the number of tested models so that additional
        computations remain unique for this model.

        Args:
            model: the model that finished.
            start: the time when the model computation started.
        """
        self.tested_models[model.get_name()] += 1

        end = time.time()

        self.event_dispatcher.dispatch(ModelEventArgs(
            ON_END_MODEL,
            model.get_name(),
            model.get_params()
        ), elapsed_time=end - start)

    def on_load_train_set_matrix(self) -> Matrix:
        """Load the train set matrix that all models can use for training.

        The default train set matrix of the model pipeline is a dataframe.
        Derived classes are allowed to override this function to return a different type of matrix.

        Returns:
            the loaded train set matrix dataframe.
        """
        return Matrix(self.data_transition.train_set_path)

    def load_train_set_matrix(self) -> None:
        """Load the train set matrix that all models can use for training.

        Raises:
            FileNotFoundError: when the train set file is not found.
        """
        self.event_dispatcher.dispatch(DataframeEventArgs(
            ON_BEGIN_LOAD_TRAIN_SET,
            self.data_transition.train_set_path,
            'model train set matrix'
        ))

        start = time.time()

        try:
            self.train_set_matrix = self.on_load_train_set_matrix()
        except FileNotFoundError as err:
            self.event_dispatcher.dispatch(ErrorEventArgs(
                ON_RAISE_ERROR,
                'FileNotFoundError: raised while trying to load the matrix train set from ' +
                self.data_transition.train_set_path
            ))
            raise err

        end = time.time()

        self.event_dispatcher.dispatch(DataframeEventArgs(
            ON_END_LOAD_TRAIN_SET,
            self.data_transition.train_set_path,
            'model train set matrix'
        ), elapsed_time=end - start)

    def load_train_set_dataframe(self) -> pd.DataFrame:
        """Load the train set as a dataframe.

        Raises:
            FileNotFoundError: when the train set file is not found.

        Returns:
            the loaded train set dataframe.
        """
        return self.read_dataframe(
            self.data_transition.train_set_path,
            'data train set',
            ON_BEGIN_LOAD_TRAIN_SET,
            ON_END_LOAD_TRAIN_SET,
            names=['user', 'item', 'rating']
        )

    def load_test_set_dataframe(self, test_name: str = 'data test set') -> pd.DataFrame:
        """Load the test set as a dataframe.

        Args:
            test_name: name of the test set dataframe to dispatch in the dataframe event.

        Raises:
            FileNotFoundError: when the test set file is not found.

        Returns:
            the loaded test set dataframe.
        """
        return self.read_dataframe(
            self.data_transition.test_set_path,
            test_name,
            ON_BEGIN_LOAD_TEST_SET,
            ON_END_LOAD_TEST_SET,
            names=['user', 'item', 'rating']
        )

    @abstractmethod
    def load_test_set_users(self) -> None:
        """Load the test set users that all models can use for testing.

        Raises:
            FileNotFoundError: when the test set file is not found.
        """
        raise NotImplementedError()

    def reconstruct_ratings(
            self,
            result_dirs: List[str],
            is_running: Callable[[], bool]) -> None:
        """Reconstruct the original ratings for all the computed model ratings.

        Args:
            result_dirs: a list of directories that contain a computed rating file.
            is_running: function that returns whether the pipeline
                is still running. Stops early when False is returned.
        """
        if not is_running() or len(result_dirs) == 0:
            return

        # TODO should probably move this code to a separate pipeline
        ratings_dataframe = pd.concat([
            self.load_train_set_dataframe(),
            self.load_test_set_dataframe()
        ])

        for model_dir in result_dirs:
            if not is_running():
                return

            result_file_path = os.path.join(model_dir, MODEL_RATINGS_FILE)

            self.event_dispatcher.dispatch(FileEventArgs(
                ON_BEGIN_RECONSTRUCT_RATINGS,
                result_file_path
            ))

            start = time.time()

            result = pd.read_csv(result_file_path, sep='\t')
            result = pd.merge(result, ratings_dataframe, how='left', on=['user', 'item'])
            result.to_csv(result_file_path, sep='\t', header=True, index=False)

            end = time.time()

            self.event_dispatcher.dispatch(FileEventArgs(
                ON_END_RECONSTRUCT_RATINGS,
                result_file_path
            ), elapsed_time=end - start)

    def test_model(
            self,
            model: BaseAlgorithm,
            model_dir: str,
            is_running: Callable[[], bool],
            **kwargs) -> None:
        """Test the specified model using the test set.

        This function wraps the event dispatching and functionality
        that both predictor and recommender models have in common.

        Args:
            model: the model that needs to be tested.
            model_dir: the path of the directory where the computed ratings can be stored.
            is_running: function that returns whether the pipeline
                is still running. Stops early when False is returned.

        Keyword Args:
            num_items(int): the number of item recommendations to produce, only
                needed when running the pipeline for recommender algorithms.

        Raises:
            ArithmeticError: possibly raised by a model on testing.
            MemoryError: possibly raised by a model on testing.
            RuntimeError: possibly raised by a model on testing.
        """
        self.event_dispatcher.dispatch(ModelEventArgs(
            ON_BEGIN_TEST_MODEL,
            model.get_name(),
            model.get_params()
        ))

        start = time.time()

        result_file_path = os.path.join(model_dir, MODEL_RATINGS_FILE)
        start_index = 0
        while start_index < len(self.test_set_users):
            if not is_running():
                return

            user_batch = self.test_set_users[start_index:start_index + MODEL_USER_BATCH_SIZE]
            ratings = self.test_model_ratings(model, user_batch, **kwargs)
            if not is_running():
                return

            self.write_dataframe(result_file_path, ratings, start_index == 0)
            start_index += MODEL_USER_BATCH_SIZE

        end = time.time()

        self.event_dispatcher.dispatch(ModelEventArgs(
            ON_END_TEST_MODEL,
            model.get_name(),
            model.get_params()
        ), elapsed_time=end - start)

    @abstractmethod
    def test_model_ratings(
            self,
            model: BaseAlgorithm,
            user_batch: List[int],
            **kwargs) -> pd.DataFrame:
        """Test the specified model for rating predictions or recommendations.

        Args:
            model: the model that needs to be tested.
            user_batch: the user batch to compute model ratings for.

        Keyword Args:
            num_items(int): the number of item recommendations to produce, only
                needed when running the pipeline for recommender algorithms.

        Raises:
            ArithmeticError: possibly raised by a model on testing.
            MemoryError: possibly raised by a model on testing.
            RuntimeError: possibly raised by a model on testing.

        Returns:
            a dataframe containing the computed model ratings.
        """
        raise NotImplementedError()

    def train_model(self, model: BaseAlgorithm) -> None:
        """Train the specified model using the train set.

        Args:
            model: the model that needs to be trained.

        Raises:
            ArithmeticError: possibly raised by a model on training.
            MemoryError: possibly raised by a model on training.
            RuntimeError: possibly raised by a model on training.
        """
        self.event_dispatcher.dispatch(ModelEventArgs(
            ON_BEGIN_TRAIN_MODEL,
            model.get_name(),
            model.get_params()
        ))

        start = time.time()

        model.train(self.train_set_matrix)

        end = time.time()

        self.event_dispatcher.dispatch(ModelEventArgs(
            ON_END_TRAIN_MODEL,
            model.get_name(),
            model.get_params()
        ), elapsed_time=end - start)

    def train_and_test_model(
            self,
            model: BaseAlgorithm,
            model_dir: str,
            is_running: Callable[[], bool],
            **kwargs) -> None:
        """Train and test the specified model.

        Several errors can be raised during the execution of both training and
        testing the model, namely ArithmeticError, MemoryError and RuntimeError.

        Args:
            model: the model that needs to be trained and tested.
            model_dir: the path of the directory where the computed ratings can be stored.
            is_running: function that returns whether the pipeline
                is still running. Stops early when False is returned.

        Keyword Args:
            num_items(int): the number of item recommendations to produce, only
                needed when running the pipeline for recommender algorithms.

        Raises:
            ArithmeticError: possibly raised by a model on training or testing.
            MemoryError: possibly raised by a model on training or testing.
            RuntimeError: possibly raised by a model on training or testing.
        """
        try:
            self.train_model(model)
        except (ArithmeticError, MemoryError, RuntimeError) as err:
            self.event_dispatcher.dispatch(ErrorEventArgs(
                ON_RAISE_ERROR,
                'Error: raised while training model ' +
                self.algo_factory.get_name() + ' ' + model.get_name()
            ))
            # raise again so the model run aborts
            raise err

        try:
            self.test_model(model, model_dir, is_running, **kwargs)
        except (ArithmeticError, MemoryError, RuntimeError) as err:
            self.event_dispatcher.dispatch(ErrorEventArgs(
                ON_RAISE_ERROR,
                'Error: raised while testing model ' +
                self.algo_factory.get_name() + ' ' + model.get_name()
            ))
            # raise again so the model run aborts
            raise err
255        """Prepare the model computation.
256
257        Resolves a unique output directory for the model computation
258        and creates the model.
259
260        Args:
261            model_name: name of the model's algorithm.
262            model_params: parameters of the algorithm.
263            model_dir: the path of the directory where the computed ratings can be stored.
264
265        Keyword Args:
266            num_threads(int): the max number of threads an algorithm can use.
267            rated_items_filter(bool): whether to filter already rated items when
268                producing item recommendations.
269
270        Raises:
271            ArithmeticError: possibly raised by a model on construction.
272            MemoryError: possibly raised by a model on construction.
273            RuntimeError: possibly raised by a model on construction.
274
275        Returns:
276            model: the created model according to the specified name and parameters.
277            start: the time when the model computation started.
278        """
279        start = time.time()
280
281        self.event_dispatcher.dispatch(ModelEventArgs(
282            ON_BEGIN_MODEL,
283            model_name,
284            model_params
285        ))
286
287        # attempt to create model
288        kwargs['rating_type'] = self.data_transition.get_rating_type()
289        model = self.algo_factory.create(
290            model_name,
291            model_params,
292            **kwargs
293        )
294
295        # create settings file
296        create_json(
297            os.path.join(model_dir, 'settings.json'),
298            model.get_params(),
299            self.event_dispatcher,
300            indent=4
301        )
302
303        return model, start
304
305    def create_model_output_dir(self, output_dir: str, model_name: str) -> str:
306        """Create the output directory for a model.
307
308        Args:
309            output_dir: the path of the directory to store the output.
310            model_name: name of the model's algorithm.
311
312        Returns:
313            the path of the directory where the model's computed ratings can be stored.
314        """
315        if self.tested_models.get(model_name) is None:
316            # initialize model name counter
317            self.tested_models[model_name] = 0
318
319        return create_dir(self.get_model_output_dir(output_dir, model_name), self.event_dispatcher)
320
321    def get_model_output_dir(self, output_dir: str, model_name: str) -> str:
322        """Get the model output directory path for the specified model name.
323
324        Args:
325            output_dir: the path of the directory to store the output.
326            model_name: name of the model's algorithm.
327
328        Returns:
329            the path of the directory where the model's computed ratings can be stored.
330        """
331        index = self.tested_models[model_name]
332        return os.path.join(
333            output_dir,
334            self.algo_factory.get_name() + '_' + model_name + '_' + str(index)
335        )
336
337    def end_model(self, model: BaseAlgorithm, start: float) -> None:
338        """Finalize the model computation.
339
340        Updates the number of tested models so that additional
341        computations remain unique for this model.
342
343        Args:
344            model: the model that finished.
345            start: the time when the model computation started.
346        """
347        self.tested_models[model.get_name()] += 1
348
349        end = time.time()
350
351        self.event_dispatcher.dispatch(ModelEventArgs(
352            ON_END_MODEL,
353            model.get_name(),
354            model.get_params()
355        ), elapsed_time=end - start)
356
357    def on_load_train_set_matrix(self) -> Matrix:
358        """Load the train set matrix that all models can use for training.
359
360        The default train set matrix of the model pipeline is a dataframe.
361        Derived classes are allowed to override this function to return a different type of matrix.
362
363        Returns:
364            the loaded train set matrix dataframe.
365        """
366        return Matrix(self.data_transition.train_set_path)
367
368    def load_train_set_matrix(self) -> None:
369        """Load the train set matrix that all models can use for training.
370
371        Raises:
372            FileNotFoundError: when the train set file is not found.
373        """
374        self.event_dispatcher.dispatch(DataframeEventArgs(
375            ON_BEGIN_LOAD_TRAIN_SET,
376            self.data_transition.train_set_path,
377            'model train set matrix'
378        ))
379
380        start = time.time()
381
382        try:
383            self.train_set_matrix = self.on_load_train_set_matrix()
384        except FileNotFoundError as err:
385            self.event_dispatcher.dispatch(ErrorEventArgs(
386                ON_RAISE_ERROR,
387                'FileNotFoundError: raised while trying to load the matrix train set from ' +
388                self.data_transition.train_set_path
389            ))
390            raise err
391
392
393        end = time.time()
394
395        self.event_dispatcher.dispatch(DataframeEventArgs(
396            ON_END_LOAD_TRAIN_SET,
397            self.data_transition.train_set_path,
398            'model train set matrix'
399        ), elapsed_time=end - start)
400
401    def load_train_set_dataframe(self) -> pd.DataFrame:
402        """Load the train set as a dataframe.
403
404        Raises:
405            FileNotFoundError: when the train set file is not found.
406
407        Returns:
408            the loaded train set dataframe.
409        """
410        return self.read_dataframe(
411            self.data_transition.train_set_path,
412            'data train set',
413            ON_BEGIN_LOAD_TRAIN_SET,
414            ON_END_LOAD_TRAIN_SET,
415            names=['user', 'item', 'rating']
416        )
417
418    def load_test_set_dataframe(self, test_name: str = 'data test set') -> pd.DataFrame:
419        """Load the test set as a dataframe.
420
421        Args:
422            test_name: name of the test set dataframe to dispatch in the dataframe event.
423
424        Raises:
425            FileNotFoundError: when the test set file is not found.
426
427        Returns:
428            the loaded test set dataframe.
429        """
430        return self.read_dataframe(
431            self.data_transition.test_set_path,
432            test_name,
433            ON_BEGIN_LOAD_TEST_SET,
434            ON_END_LOAD_TEST_SET,
435            names=['user', 'item', 'rating']
436        )
437
438    @abstractmethod
439    def load_test_set_users(self) -> None:
440        """Load the test set users that all models can use for testing.
441
442        Raises:
443            FileNotFoundError: when the test set file is not found.
444        """
445        raise NotImplementedError()
446
447    def reconstruct_ratings(
448            self,
449            result_dirs: List[str],
450            is_running: Callable[[], bool]) -> None:
451        """Reconstruct the original ratings for all computed model ratings.
452
453        Args:
454            result_dirs: a list of directories that contain a computed rating file.
455            is_running: function that returns whether the pipeline
456                is still running. Stops early when False is returned.
457        """
458        if not is_running() or len(result_dirs) == 0:
459            return
460
461        # TODO should probably move this code to a separate pipeline
462        ratings_dataframe = pd.concat([
463            self.load_train_set_dataframe(),
464            self.load_test_set_dataframe()
465        ])
466
467        for model_dir in result_dirs:
468            if not is_running():
469                return
470
471            result_file_path = os.path.join(model_dir, MODEL_RATINGS_FILE)
472
473            self.event_dispatcher.dispatch(FileEventArgs(
474                ON_BEGIN_RECONSTRUCT_RATINGS,
475                result_file_path
476            ))
477
478            start = time.time()
479
480            result = pd.read_csv(result_file_path, sep='\t')
481            result = pd.merge(result, ratings_dataframe, how='left', on=['user', 'item'])
482            result.to_csv(result_file_path, sep='\t', header=True, index=False)
483
484            end = time.time()
485
486            self.event_dispatcher.dispatch(FileEventArgs(
487                ON_END_RECONSTRUCT_RATINGS,
488                result_file_path
489            ), elapsed_time=end - start)
490
491    def test_model(
492            self,
493            model: BaseAlgorithm,
494            model_dir: str,
495            is_running: Callable[[], bool],
496            **kwargs) -> None:
497        """Test the specified model using the test set.
498
499        This function wraps the event dispatching and functionality
500        that both predictor and recommender models have in common.
501
502        Args:
503            model: the model that needs to be tested.
504            model_dir: the path of the directory where the computed ratings can be stored.
505            is_running: function that returns whether the pipeline
506                is still running. Stops early when False is returned.
507
508        Keyword Args:
509            num_items(int): the number of item recommendations to produce, only
510                needed when running the pipeline for recommender algorithms.
511
512        Raises:
513            ArithmeticError: possibly raised by a model on testing.
514            MemoryError: possibly raised by a model on testing.
515            RuntimeError: possibly raised by a model on testing.
516        """
517        self.event_dispatcher.dispatch(ModelEventArgs(
518            ON_BEGIN_TEST_MODEL,
519            model.get_name(),
520            model.get_params()
521        ))
522
523        start = time.time()
524
525        result_file_path = os.path.join(model_dir, MODEL_RATINGS_FILE)
526        start_index = 0
527        while start_index < len(self.test_set_users):
528            if not is_running():
529                return
530
531            user_batch = self.test_set_users[start_index : start_index + MODEL_USER_BATCH_SIZE]
532            ratings = self.test_model_ratings(model, user_batch, **kwargs)
533            if not is_running():
534                return
535
536            self.write_dataframe(result_file_path, ratings, start_index == 0)
537            start_index += MODEL_USER_BATCH_SIZE
538
539        end = time.time()
540
541        self.event_dispatcher.dispatch(ModelEventArgs(
542            ON_END_TEST_MODEL,
543            model.get_name(),
544            model.get_params()
545        ), elapsed_time=end - start)
546
547    @abstractmethod
548    def test_model_ratings(
549            self,
550            model: BaseAlgorithm,
551            user_batch: List[int],
552            **kwargs) -> pd.DataFrame:
553        """Test the specified model for rating predictions or recommendations.
554
555        Args:
556            model: the model that needs to be tested.
557            user_batch: the user batch to compute model ratings for.
558
559        Keyword Args:
560            num_items(int): the number of item recommendations to produce, only
561                needed when running the pipeline for recommender algorithms.
562
563        Raises:
564            ArithmeticError: possibly raised by a model on testing.
565            MemoryError: possibly raised by a model on testing.
566            RuntimeError: possibly raised by a model on testing.
567
568        Returns:
569            a dataframe containing the computed model ratings.
570        """
571        raise NotImplementedError()
572
573    def train_model(self, model: BaseAlgorithm) -> None:
574        """Train the specified model using the train set.
575
576        Args:
577            model: the model that needs to be trained.
578
579        Raises:
580            ArithmeticError: possibly raised by a model on training.
581            MemoryError: possibly raised by a model on training.
582            RuntimeError: possibly raised by a model on training.
583        """
584        self.event_dispatcher.dispatch(ModelEventArgs(
585            ON_BEGIN_TRAIN_MODEL,
586            model.get_name(),
587            model.get_params()
588        ))
589
590        start = time.time()
591
592        model.train(self.train_set_matrix)
593
594        end = time.time()
595
596        self.event_dispatcher.dispatch(ModelEventArgs(
597            ON_END_TRAIN_MODEL,
598            model.get_name(),
599            model.get_params()
600        ), elapsed_time=end - start)
601
602    def train_and_test_model(
603            self,
604            model: BaseAlgorithm,
605            model_dir: str,
606            is_running: Callable[[], bool],
607            **kwargs) -> None:
608        """Train and test the specified model.
609
610        Several possible errors can be raised during the execution of both training
611        and testing the model: namely ArithmeticError, MemoryError and RuntimeError.
612
613        Args:
614            model: the model that needs to be trained.
615            model_dir: the path of the directory where the computed ratings can be stored.
616            is_running: function that returns whether the pipeline
617                is still running. Stops early when False is returned.
618
619        Raises:
620            ArithmeticError: possibly raised by a model on training or testing.
621            MemoryError: possibly raised by a model on training or testing.
622            RuntimeError: possibly raised by a model on training or testing.
623
624        Keyword Args:
625            num_items(int): the number of item recommendations to produce, only
626                needed when running the pipeline for recommender algorithms.
627        """
628        try:
629            self.train_model(model)
630        except (ArithmeticError, MemoryError, RuntimeError) as err:
631            self.event_dispatcher.dispatch(ErrorEventArgs(
632                ON_RAISE_ERROR,
633                'Error: raised while training model ' +
634                self.algo_factory.get_name() + ' ' + model.get_name()
635            ))
636            # raise again so the model run aborts
637            raise err
638
639        try:
640            self.test_model(model, model_dir, is_running, **kwargs)
641        except (ArithmeticError, MemoryError, RuntimeError) as err:
642            self.event_dispatcher.dispatch(ErrorEventArgs(
643                ON_RAISE_ERROR,
644                'Error: raised while testing model ' +
645                self.algo_factory.get_name() + ' ' + model.get_name()
646            ))
647            # raise again so the model run aborts
648            raise err

Model Pipeline to run computations for algorithms from a specific API.

Wraps the common functionality that applies to all models regardless of their type. Loading the train and test set is done only once each time the pipeline is run. After both sets are loaded, the pipeline loops through all specified models and executes the following steps:

1) create the output directory.
2) create the model.
3) save the model's creation settings.
4) train the model using the train set.
5) test the model using the test set.

After all models are trained and tested, the computed rating files are updated with the original ratings from the train and test set.
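The rating reconstruction mentioned above amounts to a left merge of the original ratings onto each computed rating file. A standalone sketch with toy data (column names follow the pipeline's 'user', 'item', 'rating' convention; 'score' is a hypothetical computed column):

```python
import pandas as pd

# Toy stand-ins for the train set, test set, and a model's computed ratings;
# the real pipeline reads these from tab-separated files.
train_set = pd.DataFrame({'user': [1, 1], 'item': [10, 11], 'rating': [4.0, 3.0]})
test_set = pd.DataFrame({'user': [2], 'item': [10], 'rating': [5.0]})
computed = pd.DataFrame({'user': [1, 2], 'item': [11, 10], 'score': [0.9, 0.7]})

# Concatenate the original ratings and left-merge them onto the computed
# ratings on the (user, item) pair, mirroring reconstruct_ratings.
originals = pd.concat([train_set, test_set])
result = pd.merge(computed, originals, how='left', on=['user', 'item'])
```

Each computed row gains the original rating for its (user, item) pair; pairs absent from the original sets would get NaN.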

Abstract methods:

    load_test_set_users
    test_model_ratings

Public methods:

    run
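The shape of the two abstract members can be sketched as follows. This is a hypothetical stub (the class name, user ids, and constant ratings are invented for illustration); a real concrete pipeline would derive from ModelPipeline and query the actual test set and model:

```python
import pandas as pd

class ToyPredictionPipeline:
    """Hypothetical sketch of the two members a concrete pipeline overrides."""

    def load_test_set_users(self) -> None:
        # e.g. the unique users present in the test set dataframe
        self.test_set_users = [1, 2, 3]

    def test_model_ratings(self, model, user_batch, **kwargs) -> pd.DataFrame:
        # a predictor would query the model here; this stub returns constants
        return pd.DataFrame({'user': user_batch, 'item': 0, 'rating': 1.0})
```

The pipeline's run loop only relies on these two members plus the shared train/test loading, so this is all a subclass needs to provide.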

ModelPipeline( algo_factory: src.fairreckitlib.core.config.config_factories.Factory, data_transition: src.fairreckitlib.data.data_transition.DataTransition, event_dispatcher: src.fairreckitlib.core.events.event_dispatcher.EventDispatcher)
69    def __init__(
70            self,
71            algo_factory: Factory,
72            data_transition: DataTransition,
73            event_dispatcher: EventDispatcher):
74        """Construct the model pipeline.
75
76        Args:
77            algo_factory: factory of available algorithms for this API.
78            data_transition: data input.
79            event_dispatcher: used to dispatch model/IO events when running the pipeline.
80        """
81        CorePipeline.__init__(self, event_dispatcher)
82        self.algo_factory = algo_factory
83        self.data_transition = data_transition
84        self.tested_models = {}
85
86        self.train_set_matrix = None
87        self.test_set_users = None

def run( self, output_dir: str, models_config: List[src.fairreckitlib.model.pipeline.model_config.ModelConfig], is_running: Callable[[], bool], **kwargs) -> List[str]:
 89    def run(self,
 90            output_dir: str,
 91            models_config: List[ModelConfig],
 92            is_running: Callable[[], bool],
 93            **kwargs) -> List[str]:
 94        """Run the entire pipeline from beginning to end.
 95
 96        Effectively running all computations of the specified models.
 97
 98        Args:
 99            output_dir: the path of the directory to store the output.
100            models_config: list of ModelConfig objects to compute.
101            is_running: function that returns whether the pipeline
102                is still running. Stops early when False is returned.
103
104        Keyword Args:
105            num_threads(int): the max number of threads an algorithm can use.
106            num_items(int): the number of item recommendations to produce, only
107                needed when running the pipeline for recommender algorithms.
108            rated_items_filter(bool): whether to filter already rated items when
109                producing item recommendations.
110
111        Raises:
112            FileNotFoundError: when the train and/or test set fails to load.
113
114        Returns:
115            a list of model directories where computation results are stored.
116        """
117        result_dirs = []
118        if not is_running():
119            return result_dirs
120
121        self.event_dispatcher.dispatch(ModelPipelineEventArgs(
122            ON_BEGIN_MODEL_PIPELINE,
123            self.algo_factory.get_name(),
124            models_config
125        ))
126
127        start = time.time()
128
129        # this can raise a FileNotFoundError, effectively aborting the pipeline
130        self.load_train_set_matrix()
131        if not is_running():
132            return result_dirs
133
134        # this can raise a FileNotFoundError, effectively aborting the pipeline
135        self.load_test_set_users()
136        if not is_running():
137            return result_dirs
138
139        for model in models_config:
140            # verify that the specified model is available
141            if not self.algo_factory.is_obj_available(model.name):
142                self.event_dispatcher.dispatch(ErrorEventArgs(
143                    ON_FAILURE_ERROR,
144                    'Failure: algorithm is not available: ' +
145                    self.algo_factory.get_name() + ' ' + model.name
146                ))
147                continue
148
149            # create model output dir
150            model_dir = self.create_model_output_dir(
151                output_dir,
152                model.name
153            )
154
155            # attempt to run the model computation
156            try:
157                self.run_model(
158                    model_dir,
159                    model,
160                    is_running,
161                    **kwargs
162                )
163            except ArithmeticError:
164                self.event_dispatcher.dispatch(ErrorEventArgs(
165                    ON_RAISE_ERROR,
166                    'ArithmeticError: trying to run model ' +
167                    self.algo_factory.get_name() + ' ' + model.name
168                ))
169                delete_dir(model_dir, self.event_dispatcher)
170                continue
171            except MemoryError:
172                self.event_dispatcher.dispatch(ErrorEventArgs(
173                    ON_RAISE_ERROR,
174                    'MemoryError: trying to run model ' +
175                    self.algo_factory.get_name() + ' ' + model.name
176                ))
177                delete_dir(model_dir, self.event_dispatcher)
178                continue
179            except RuntimeError:
180                self.event_dispatcher.dispatch(ErrorEventArgs(
181                    ON_RAISE_ERROR,
182                    'RuntimeError: trying to run model ' +
183                    self.algo_factory.get_name() + ' ' + model.name
184                ))
185                delete_dir(model_dir, self.event_dispatcher)
186                continue
187
188            result_dirs.append(model_dir)
189            if not is_running():
190                return result_dirs
191
192        # free up some memory because everything is trained and tested
193        self.train_set_matrix = None
194        self.test_set_users = None
195
196        self.reconstruct_ratings(result_dirs, is_running)
197
198        end = time.time()
199
200        self.event_dispatcher.dispatch(ModelPipelineEventArgs(
201            ON_END_MODEL_PIPELINE,
202            self.algo_factory.get_name(),
203            models_config
204        ), elapsed_time=end - start)
205
206        return result_dirs
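The is_running parameter can be any zero-argument callable. One simple, thread-safe implementation is a cancellation flag (the commented-out run(...) call is illustrative; the variable names are assumptions):

```python
import threading

# Event set by another thread (e.g. a UI) to request cancellation.
cancelled = threading.Event()

def is_running() -> bool:
    # the pipeline stops early as soon as this returns False
    return not cancelled.is_set()

# pipeline.run(output_dir, models_config, is_running, num_threads=1)
```

Because the pipeline polls is_running between models, between batches, and around training/testing, setting the event stops the computation at the next checkpoint rather than mid-batch.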

def run_model( self, model_dir: str, model_config: src.fairreckitlib.model.pipeline.model_config.ModelConfig, is_running: Callable[[], bool], **kwargs) -> None:

Run the model computation for the specified model configuration.

Args:
    model_dir: the path of the directory where the computed ratings can be stored.
    model_config: the algorithm model configuration.
    is_running: function that returns whether the pipeline is still running.
        Stops early when False is returned.

Keyword Args:
    num_threads(int): the max number of threads an algorithm can use.
    num_items(int): the number of item recommendations to produce, only
        needed when running the pipeline for recommender algorithms.
    rated_items_filter(bool): whether to filter already rated items when
        producing item recommendations.

Raises:
    ArithmeticError: possibly raised by a model on construction, training or testing.
    MemoryError: possibly raised by a model on construction, training or testing.
    RuntimeError: possibly raised by a model on construction, training or testing.

def begin_model( self, model_name: str, model_params: Dict[str, Any], model_dir: str, **kwargs) -> Tuple[src.fairreckitlib.model.algorithms.base_algorithm.BaseAlgorithm, float]:

Prepare the model computation.

Resolves a unique output directory for the model computation and creates the model.

Args:
    model_name: name of the model's algorithm.
    model_params: parameters of the algorithm.
    model_dir: the path of the directory where the computed ratings can be stored.

Keyword Args:
    num_threads(int): the max number of threads an algorithm can use.
    rated_items_filter(bool): whether to filter already rated items when
        producing item recommendations.

Raises:
    ArithmeticError: possibly raised by a model on construction.
    MemoryError: possibly raised by a model on construction.
    RuntimeError: possibly raised by a model on construction.

Returns:
    model: the created model according to the specified name and parameters.
    start: the time when the model computation started.
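Persisting the creation settings boils down to serializing the model's parameters as indented JSON next to the ratings file. A minimal sketch, assuming hypothetical parameter names and using a temporary directory in place of the real model directory:

```python
import json
import os
import tempfile

# Hypothetical algorithm parameters; begin_model obtains these
# from the created model via model.get_params().
params = {'num_factors': 10, 'num_iterations': 20}

model_dir = tempfile.mkdtemp()
settings_path = os.path.join(model_dir, 'settings.json')
with open(settings_path, 'w', encoding='utf-8') as file:
    # indent=4 reproduces the settings file layout used by the pipeline
    json.dump(params, file, indent=4)
```

In the library itself this is handled by the create_json IO helper, which additionally dispatches a file event.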

def create_model_output_dir(self, output_dir: str, model_name: str) -> str:

Create the output directory for a model.

Args:
    output_dir: the path of the directory to store the output.
    model_name: name of the model's algorithm.

Returns:
    the path of the directory where the model's computed ratings can be stored.

def get_model_output_dir(self, output_dir: str, model_name: str) -> str:

Get the model output directory path for the specified model name.

Args: output_dir: the path of the directory to store the output. model_name: name of the model's algorithm.

Returns: the path of the directory where the model's computed ratings can be stored.
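The directory name is composed from the algorithm factory's API name, the model name, and the model's run index. A minimal sketch of that composition, with `api_name` and `index` as hypothetical stand-ins for `self.algo_factory.get_name()` and `self.tested_models[model_name]`:

```python
import os

def get_model_output_dir(output_dir: str, api_name: str, model_name: str, index: int) -> str:
    """Compose the model output directory path as '<api_name>_<model_name>_<index>'."""
    return os.path.join(output_dir, api_name + '_' + model_name + '_' + str(index))

# The index increments per finished computation, so repeated runs of the
# same algorithm land in distinct directories.
first_run = get_model_output_dir('results', 'LensKit', 'ItemKNN', 0)
second_run = get_model_output_dir('results', 'LensKit', 'ItemKNN', 1)
```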

def end_model( self, model: src.fairreckitlib.model.algorithms.base_algorithm.BaseAlgorithm, start: float) -> None:
337    def end_model(self, model: BaseAlgorithm, start: float) -> None:
338        """Finalize the model computation.
339
340        Updates the number of tested models so that additional
341        computations remain unique for this model.
342
343        Args:
344            model: the model that finished.
345            start: the time when the model computation started.
346        """
347        self.tested_models[model.get_name()] += 1
348
349        end = time.time()
350
351        self.event_dispatcher.dispatch(ModelEventArgs(
352            ON_END_MODEL,
353            model.get_name(),
354            model.get_params()
355        ), elapsed_time=end - start)

Finalize the model computation.

Updates the number of tested models so that additional computations remain unique for this model.

Args: model: the model that finished. start: the time when the model computation started.

def on_load_train_set_matrix(self) -> src.fairreckitlib.model.algorithms.matrix.Matrix:
357    def on_load_train_set_matrix(self) -> Matrix:
358        """Load the train set matrix that all models can use for training.
359
360        The default train set matrix of the model pipeline is a dataframe.
361        Derived classes are allowed to override this function to return a different type of matrix.
362
363        Returns:
364            the loaded train set matrix dataframe.
365        """
366        return Matrix(self.data_transition.train_set_path)

Load the train set matrix that all models can use for training.

The default train set matrix of the model pipeline is a dataframe. Derived classes are allowed to override this function to return a different type of matrix.

Returns: the loaded train set matrix dataframe.

def load_train_set_matrix(self) -> None:
368    def load_train_set_matrix(self) -> None:
369        """Load the train set matrix that all models can use for training.
370
371        Raises:
372            FileNotFoundError: when the train set file is not found.
373        """
374        self.event_dispatcher.dispatch(DataframeEventArgs(
375            ON_BEGIN_LOAD_TRAIN_SET,
376            self.data_transition.train_set_path,
377            'model train set matrix'
378        ))
379
380        start = time.time()
381
382        try:
383            self.train_set_matrix = self.on_load_train_set_matrix()
384        except FileNotFoundError as err:
385            self.event_dispatcher.dispatch(ErrorEventArgs(
386                ON_RAISE_ERROR,
387                'FileNotFoundError: raised while trying to load the matrix train set from ' +
388                self.data_transition.train_set_path
389            ))
390            raise err
391
392
393        end = time.time()
394
395        self.event_dispatcher.dispatch(DataframeEventArgs(
396            ON_END_LOAD_TRAIN_SET,
397            self.data_transition.train_set_path,
398            'model train set matrix'
399        ), elapsed_time=end - start)

Load the train set matrix that all models can use for training.

Raises: FileNotFoundError: when the train set file is not found.

def load_train_set_dataframe(self) -> pandas.core.frame.DataFrame:
401    def load_train_set_dataframe(self) -> pd.DataFrame:
402        """Load the train set as a dataframe.
403
404        Raises:
405            FileNotFoundError: when the train set file is not found.
406
407        Returns:
408            the loaded train set dataframe.
409        """
410        return self.read_dataframe(
411            self.data_transition.train_set_path,
412            'data train set',
413            ON_BEGIN_LOAD_TRAIN_SET,
414            ON_END_LOAD_TRAIN_SET,
415            names=['user', 'item', 'rating']
416        )

Load the train set as a dataframe.

Raises: FileNotFoundError: when the train set file is not found.

Returns: the loaded train set dataframe.

def load_test_set_dataframe(self, test_name: str = 'data test set') -> pandas.core.frame.DataFrame:
418    def load_test_set_dataframe(self, test_name: str='data test set') -> pd.DataFrame:
419        """Load the test set as a dataframe.
420
421        Args:
422            test_name: name of the test set dataframe to dispatch in the dataframe event.
423
424        Raises:
425            FileNotFoundError: when the test set file is not found.
426
427        Returns:
428            the loaded test set dataframe.
429        """
430        return self.read_dataframe(
431            self.data_transition.test_set_path,
432            test_name,
433            ON_BEGIN_LOAD_TEST_SET,
434            ON_END_LOAD_TEST_SET,
435            names=['user', 'item', 'rating']
436        )

Load the test set as a dataframe.

Args: test_name: name of the test set dataframe to dispatch in the dataframe event.

Raises: FileNotFoundError: when the test set file is not found.

Returns: the loaded test set dataframe.
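Both loaders pass `names=['user', 'item', 'rating']` through to `read_dataframe`, which suggests the train and test sets are stored as headerless, tab-separated files. Assuming `read_dataframe` ultimately forwards these arguments to `pandas.read_csv`, loading such a file directly would look roughly like:

```python
import io

import pandas as pd

# A headerless, tab-separated rating file, as the sets are assumed to be stored.
raw = io.StringIO('1\t10\t4.0\n1\t20\t3.5\n2\t10\t5.0\n')

# 'names' labels the columns since the file itself carries no header row.
ratings = pd.read_csv(raw, sep='\t', header=None, names=['user', 'item', 'rating'])
```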

@abstractmethod
def load_test_set_users(self) -> None:
438    @abstractmethod
439    def load_test_set_users(self) -> None:
440        """Load the test set users that all models can use for testing.
441
442        Raises:
443            FileNotFoundError: when the test set file is not found.
444        """
445        raise NotImplementedError()

Load the test set users that all models can use for testing.

Raises: FileNotFoundError: when the test set file is not found.

def reconstruct_ratings(self, result_dirs: List[str], is_running: Callable[[], bool]) -> None:
447    def reconstruct_ratings(
448            self,
449            result_dirs: List[str],
450            is_running: Callable[[], bool]) -> None:
451        """Reconstruct the original ratings for all the computed model ratings.
452
453        Args:
454            result_dirs: a list of directories that contain a computed rating file.
455            is_running: function that returns whether the pipeline
456                is still running. Stops early when False is returned.
457        """
458        if not is_running() or len(result_dirs) == 0:
459            return
460
461        # TODO should probably move this code to a separate pipeline
462        ratings_dataframe = pd.concat([
463            self.load_train_set_dataframe(),
464            self.load_test_set_dataframe()
465        ])
466
467        for model_dir in result_dirs:
468            if not is_running():
469                return
470
471            result_file_path = os.path.join(model_dir, MODEL_RATINGS_FILE)
472
473            self.event_dispatcher.dispatch(FileEventArgs(
474                ON_BEGIN_RECONSTRUCT_RATINGS,
475                result_file_path
476            ))
477
478            start = time.time()
479
480            result = pd.read_csv(result_file_path, sep='\t')
481            result = pd.merge(result, ratings_dataframe, how='left', on=['user', 'item'])
482            result.to_csv(result_file_path, sep='\t', header=True, index=False)
483
484            end = time.time()
485
486            self.event_dispatcher.dispatch(FileEventArgs(
487                ON_END_RECONSTRUCT_RATINGS,
488                result_file_path
489            ), elapsed_time=end - start)

Reconstruct the original ratings for all the computed model ratings.

Args: result_dirs: a list of directories that contain a computed rating file. is_running: function that returns whether the pipeline is still running. Stops early when False is returned.
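The reconstruction step concatenates the train and test sets into one ratings dataframe, then left-joins each result file against it on `(user, item)`. A small self-contained sketch of that merge, using made-up data in place of the files on disk:

```python
import pandas as pd

# Original ratings: stands in for the concatenated train and test sets.
ratings_dataframe = pd.DataFrame({
    'user':   [1, 1, 2],
    'item':   [10, 20, 10],
    'rating': [4.0, 3.5, 5.0],
})

# A computed result file: user/item pairs with a model score.
result = pd.DataFrame({
    'user':  [1, 2],
    'item':  [20, 10],
    'score': [0.9, 0.7],
})

# The left join keeps every computed row and attaches the original rating
# where a matching (user, item) pair exists.
result = pd.merge(result, ratings_dataframe, how='left', on=['user', 'item'])
```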

def test_model( self, model: src.fairreckitlib.model.algorithms.base_algorithm.BaseAlgorithm, model_dir: str, is_running: Callable[[], bool], **kwargs) -> None:
491    def test_model(
492            self,
493            model: BaseAlgorithm,
494            model_dir: str,
495            is_running: Callable[[], bool],
496            **kwargs) -> None:
497        """Test the specified model using the test set.
498
499        This function wraps the event dispatching and functionality
500        that both predictor and recommender models have in common.
501
502        Args:
503            model: the model that needs to be tested.
504            model_dir: the path of the directory where the computed ratings can be stored.
505            is_running: function that returns whether the pipeline
506                is still running. Stops early when False is returned.
507
508        Keyword Args:
509            num_items(int): the number of item recommendations to produce, only
510                needed when running the pipeline for recommender algorithms.
511
512        Raises:
513            ArithmeticError: possibly raised by a model on testing.
514            MemoryError: possibly raised by a model on testing.
515            RuntimeError: possibly raised by a model on testing.
516        """
517        self.event_dispatcher.dispatch(ModelEventArgs(
518            ON_BEGIN_TEST_MODEL,
519            model.get_name(),
520            model.get_params()
521        ))
522
523        start = time.time()
524
525        result_file_path = os.path.join(model_dir, MODEL_RATINGS_FILE)
526        start_index = 0
527        while start_index < len(self.test_set_users):
528            if not is_running():
529                return
530
531            user_batch = self.test_set_users[start_index : start_index + MODEL_USER_BATCH_SIZE]
532            ratings = self.test_model_ratings(model, user_batch, **kwargs)
533            if not is_running():
534                return
535
536            self.write_dataframe(result_file_path, ratings, start_index == 0)
537            start_index += MODEL_USER_BATCH_SIZE
538
539        end = time.time()
540
541        self.event_dispatcher.dispatch(ModelEventArgs(
542            ON_END_TEST_MODEL,
543            model.get_name(),
544            model.get_params()
545        ), elapsed_time=end - start)

Test the specified model using the test set.

This function wraps the event dispatching and functionality that both predictor and recommender models have in common.

Args: model: the model that needs to be tested. model_dir: the path of the directory where the computed ratings can be stored. is_running: function that returns whether the pipeline is still running. Stops early when False is returned.

Keyword Args: num_items(int): the number of item recommendations to produce, only needed when running the pipeline for recommender algorithms.

Raises: ArithmeticError: possibly raised by a model on testing. MemoryError: possibly raised by a model on testing. RuntimeError: possibly raised by a model on testing.
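The test loop slices the test set users into fixed-size batches and appends each batch's ratings to the result file, writing the header only for the first batch. The slicing logic alone, with small stand-in values for `self.test_set_users` and `MODEL_USER_BATCH_SIZE`:

```python
# Hypothetical stand-ins for the pipeline's test users and batch size constant.
test_set_users = list(range(10))
MODEL_USER_BATCH_SIZE = 4

batches = []
start_index = 0
while start_index < len(test_set_users):
    # Python slicing past the end is safe, so the last batch may be shorter.
    user_batch = test_set_users[start_index : start_index + MODEL_USER_BATCH_SIZE]
    batches.append(user_batch)
    # In the pipeline, ratings for this batch are computed and written here;
    # the header flag is (start_index == 0), i.e. first batch only.
    start_index += MODEL_USER_BATCH_SIZE
```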

@abstractmethod
def test_model_ratings( self, model: src.fairreckitlib.model.algorithms.base_algorithm.BaseAlgorithm, user_batch: List[int], **kwargs) -> pandas.core.frame.DataFrame:
547    @abstractmethod
548    def test_model_ratings(
549            self,
550            model: BaseAlgorithm,
551            user_batch: List[int],
552            **kwargs) -> pd.DataFrame:
553        """Test the specified model for rating predictions or recommendations.
554
555        Args:
556            model: the model that needs to be tested.
557            user_batch: the user batch to compute model ratings for.
558
559        Keyword Args:
560            num_items(int): the number of item recommendations to produce, only
561                needed when running the pipeline for recommender algorithms.
562
563        Raises:
564            ArithmeticError: possibly raised by a model on testing.
565            MemoryError: possibly raised by a model on testing.
566            RuntimeError: possibly raised by a model on testing.
567
568        Returns:
569            a dataframe containing the computed model ratings.
570        """
571        raise NotImplementedError()

Test the specified model for rating predictions or recommendations.

Args: model: the model that needs to be tested. user_batch: the user batch to compute model ratings for.

Keyword Args: num_items(int): the number of item recommendations to produce, only needed when running the pipeline for recommender algorithms.

Raises: ArithmeticError: possibly raised by a model on testing. MemoryError: possibly raised by a model on testing. RuntimeError: possibly raised by a model on testing.

Returns: a dataframe containing the computed model ratings.

def train_model( self, model: src.fairreckitlib.model.algorithms.base_algorithm.BaseAlgorithm) -> None:
573    def train_model(self, model: BaseAlgorithm) -> None:
574        """Train the specified model using the train set.
575
576        Args:
577            model: the model that needs to be trained.
578
579        Raises:
580            ArithmeticError: possibly raised by a model on training.
581            MemoryError: possibly raised by a model on training.
582            RuntimeError: possibly raised by a model on training.
583        """
584        self.event_dispatcher.dispatch(ModelEventArgs(
585            ON_BEGIN_TRAIN_MODEL,
586            model.get_name(),
587            model.get_params()
588        ))
589
590        start = time.time()
591
592        model.train(self.train_set_matrix)
593
594        end = time.time()
595
596        self.event_dispatcher.dispatch(ModelEventArgs(
597            ON_END_TRAIN_MODEL,
598            model.get_name(),
599            model.get_params()
600        ), elapsed_time=end - start)

Train the specified model using the train set.

Args: model: the model that needs to be trained.

Raises: ArithmeticError: possibly raised by a model on training. MemoryError: possibly raised by a model on training. RuntimeError: possibly raised by a model on training.

def train_and_test_model( self, model: src.fairreckitlib.model.algorithms.base_algorithm.BaseAlgorithm, model_dir: str, is_running: Callable[[], bool], **kwargs) -> None:
602    def train_and_test_model(
603            self,
604            model: BaseAlgorithm,
605            model_dir: str,
606            is_running: Callable[[], bool],
607            **kwargs) -> None:
608        """Train and test the specified model.
609
610        Several possible errors can be raised during the execution of both training and
611        testing the model: namely ArithmeticError, MemoryError and RuntimeError.
612
613        Args:
614            model: the model that needs to be trained and tested.
615            model_dir: the path of the directory where the computed ratings can be stored.
616            is_running: function that returns whether the pipeline
617                is still running. Stops early when False is returned.
618
619        Raises:
620            ArithmeticError: possibly raised by a model on training or testing.
621            MemoryError: possibly raised by a model on training or testing.
622            RuntimeError: possibly raised by a model on training or testing.
623
624        Keyword Args:
625            num_items(int): the number of item recommendations to produce, only
626                needed when running the pipeline for recommender algorithms.
627        """
628        try:
629            self.train_model(model)
630        except (ArithmeticError, MemoryError, RuntimeError) as err:
631            self.event_dispatcher.dispatch(ErrorEventArgs(
632                ON_RAISE_ERROR,
633                'Error: raised while training model ' +
634                self.algo_factory.get_name() + ' ' + model.get_name()
635            ))
636            # raise again so the model run aborts
637            raise err
638
639        try:
640            self.test_model(model, model_dir, is_running, **kwargs)
641        except (ArithmeticError, MemoryError, RuntimeError) as err:
642            self.event_dispatcher.dispatch(ErrorEventArgs(
643                ON_RAISE_ERROR,
644                'Error: raised while testing model ' +
645                self.algo_factory.get_name() + ' ' + model.get_name()
646            ))
647            # raise again so the model run aborts
648            raise err

Train and test the specified model.

Several possible errors can be raised during the execution of both training and testing the model, namely ArithmeticError, MemoryError and RuntimeError.

Args: model: the model that needs to be trained and tested. model_dir: the path of the directory where the computed ratings can be stored. is_running: function that returns whether the pipeline is still running. Stops early when False is returned.

Raises: ArithmeticError: possibly raised by a model on training or testing. MemoryError: possibly raised by a model on training or testing. RuntimeError: possibly raised by a model on training or testing.

Keyword Args: num_items(int): the number of item recommendations to produce, only needed when running the pipeline for recommender algorithms.
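Both the training and testing calls follow the same pattern: catch the known error types, dispatch an error event, then re-raise so the model run aborts. A minimal sketch of that pattern, with a list-backed stub standing in for `event_dispatcher.dispatch(ErrorEventArgs(...))` and a deliberately failing `train`:

```python
# Stub dispatcher: records messages instead of dispatching ErrorEventArgs.
errors = []

def dispatch_error(message: str) -> None:
    errors.append(message)

def train(model_name: str) -> None:
    # Hypothetical failure: a model raising one of the documented error types.
    raise MemoryError('model too large')

aborted = False
try:
    try:
        train('ItemKNN')
    except (ArithmeticError, MemoryError, RuntimeError):
        dispatch_error('Error: raised while training model ItemKNN')
        raise  # raise again so the model run aborts
except MemoryError:
    # A caller higher up (e.g. the model run) observes the re-raised error.
    aborted = True
```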