有人可以帮我从网格搜索中提取性能最佳模型的参数吗？不知为何，我得到的是一个空字典。
from pyspark.ml.tuning import ParamGridBuilder, TrainValidationSplit, CrossValidator
from pyspark.ml.evaluation import BinaryClassificationEvaluator
# Split the input DataFrame 66% / 34% into train and test sets; the fixed
# seed makes the split reproducible. (`df` is defined outside this snippet.)
train, test = df.randomSplit(
    [0.66, 0.34],
    seed=12345,
)

# Hyper-parameter grid: two regParam values crossed with a single
# elasticNetParam and a single maxIter value, i.e. two candidate param maps.
# (`lr` is the estimator stage defined outside this snippet.)
paramGrid = (
    ParamGridBuilder()
    .addGrid(lr.regParam, [0.01, 0.1])
    .addGrid(lr.elasticNetParam, [1.0])
    .addGrid(lr.maxIter, [3])
    .build()
)

# Score candidates by area under the ROC curve, reading raw predictions from
# "rawPrediction" and ground-truth labels from the "buy" column.
evaluator = BinaryClassificationEvaluator(
    rawPredictionCol="rawPrediction",
    labelCol="buy",
    metricName="areaUnderROC",
)

# 2-fold cross-validation of the pipeline over every param map in the grid.
# (`pipeline` is defined outside this snippet.)
cv = CrossValidator(
    estimator=pipeline,
    estimatorParamMaps=paramGrid,
    evaluator=evaluator,
    numFolds=2,
)

# Fit on the training split only; the result exposes the winning model as
# `cvModel.bestModel`.
cvModel = cv.fit(train)
> print(cvModel.bestModel) #it looks like I have a valid bestModel
PipelineMod