我正在开发一个文本分类项目,并尝试使用 SVC(kernel='linear') 来获取特征重要性。这是我的代码(根据这篇文章中的代码修改而来):
# Split the data frame into the model inputs (the columns listed in
# `features`) and the target column.
X, y = df1[features], df1['label']
# Create selector class for text and numbers
class TextSelector(BaseEstimator, TransformerMixin):
    """Transformer that selects a single column from a data frame.

    The selected column is returned unchanged so that later steps can
    perform additional transformations on it.

    Parameters
    ----------
    key
        Label used to index the input passed to ``transform``.
    """

    def __init__(self, key):
        self.key = key

    def fit(self, X, y=None):
        """Do nothing and return ``self``; there is no state to learn."""
        return self

    def transform(self, X):
        """Return ``X[self.key]``."""
        return X[self.key]
class NumberSelector(BaseEstimator, TransformerMixin):
"""For data grouped by feature, select subset of data at a provided key."""
def __init__(self, key):
self.key = key
def fit(self, X, …Run Code Online (Sandbox Code Playgroud)