Source code for py_entitymatching.matcher.rfmatcher

"""
This module contains the functions for Random Forest classifier.
"""

from py_entitymatching.matcher.mlmatcher import MLMatcher
from py_entitymatching.matcher.matcherutils import get_ts

from sklearn.ensemble import RandomForestClassifier

[docs]class RFMatcher(MLMatcher): """ Random Forest matcher. Args: *args,**kwargs: The arguments to scikit-learn's Random Forest classifier. name (string): The name of this matcher (defaults to None). If the matcher name is None, the class automatically generates a string and assigns it as the name. """ def __init__(self, *args, **kwargs): super(RFMatcher, self).__init__() # If the name is given, then pop it name = kwargs.pop('name', None) if name is None: # If the name of the matcher is give, then create one. # Currently, we use a constant string + a random number. self.name = 'RandomForest'+ '_' + get_ts() else: # Set the name of the matcher, with the given name. self.name = name # Set the classifier to the scikit-learn classifier. self.clf = RandomForestClassifier(*args, **kwargs)