# nbertagnolli/get_feature_names.py

## get_feature_names.py
from typing import List

from sklearn.pipeline import FeatureUnion, Pipeline

def get_feature_names(model, names: List[str], name: str) -> List[str]:
    """Extract feature names, in order, from a scikit-learn Pipeline.

    Walks nested ``Pipeline`` and ``FeatureUnion`` objects depth first and
    collects the names produced by every step whose name appears in
    ``names``. The actual name extraction for a matching step is delegated
    to ``extract_feature_names``, which is defined outside this function.

    Args:
        model: The pipeline, feature union, or individual step to inspect.
        names: The names of the final featurization steps.
        name: The name of the step that ``model`` is registered under.

    Returns:
        The feature names gathered from the matching steps, in traversal
        order. An object that is neither a requested step nor a
        Pipeline/FeatureUnion contributes an empty list.
    """
    # Base case: this step is one of the requested featurization steps.
    if name in names:
        # A step exposing ``named_steps`` is itself a pipeline, so hand over
        # its inner step registered under the same name.
        if hasattr(model, "named_steps"):
            return extract_feature_names(model.named_steps[name], name)
        # Otherwise the step is the featurizer itself.
        return extract_feature_names(model, name)

    # isinstance (rather than an exact type match) so that subclasses of
    # Pipeline / FeatureUnion are traversed instead of silently skipped.
    if isinstance(model, Pipeline):
        children = model.named_steps.items()
    elif isinstance(model, FeatureUnion):
        children = model.transformer_list
    else:
        # Neither a feature step nor a container: nothing to collect.
        return []

    # Recurse into every child; distinct loop names avoid shadowing the
    # ``name`` parameter.
    feature_names: List[str] = []
    for child_name, child in children:
        feature_names.extend(get_feature_names(child, names, child_name))
    return feature_names
	from sklearn.pipeline import FeatureUnion, Pipeline

	def get_feature_names(model, names: List[str], name: str) -> List[str]:
	    """Extract feature names, in order, from a scikit-learn Pipeline.

	    Walks nested ``Pipeline`` and ``FeatureUnion`` objects depth first and
	    collects the names produced by every step whose name appears in
	    ``names``. The actual name extraction for a matching step is delegated
	    to ``extract_feature_names``, which is defined outside this function.

	    Args:
	        model: The pipeline, feature union, or individual step to inspect.
	        names: The names of the final featurization steps.
	        name: The name of the step that ``model`` is registered under.

	    Returns:
	        The feature names gathered from the matching steps, in traversal
	        order. An object that is neither a requested step nor a
	        Pipeline/FeatureUnion contributes an empty list.
	    """
	    # Base case: this step is one of the requested featurization steps.
	    if name in names:
	        # A step exposing ``named_steps`` is itself a pipeline, so hand over
	        # its inner step registered under the same name.
	        if hasattr(model, "named_steps"):
	            return extract_feature_names(model.named_steps[name], name)
	        # Otherwise the step is the featurizer itself.
	        return extract_feature_names(model, name)

	    # isinstance (rather than an exact type match) so that subclasses of
	    # Pipeline / FeatureUnion are traversed instead of silently skipped.
	    if isinstance(model, Pipeline):
	        children = model.named_steps.items()
	    elif isinstance(model, FeatureUnion):
	        children = model.transformer_list
	    else:
	        # Neither a feature step nor a container: nothing to collect.
	        return []

	    # Recurse into every child; distinct loop names avoid shadowing the
	    # ``name`` parameter.
	    feature_names: List[str] = []
	    for child_name, child in children:
	        feature_names.extend(get_feature_names(child, names, child_name))
	    return feature_names