function plotData(X, y)
%PLOTDATA Scatter-plot labelled 2-D examples in a new figure.
%   PLOTDATA(X, y) opens a new figure and draws the rows of X whose label
%   in y equals 1 as black '+' markers and the rows whose label equals 0
%   as black circles filled with yellow. X is assumed to be an Mx2 matrix
%   (column 1 on the horizontal axis, column 2 on the vertical axis).
%   Hold is switched off again before returning.

    % Open a fresh figure and keep both series on the same axes.
    figure;
    hold on;

    % Logical masks selecting each class.
    isPositive = (y == 1);
    isNegative = (y == 0);

    % Positive examples: black plus signs.
    plot(X(isPositive, 1), X(isPositive, 2), ...
         'k+', 'Linewidth', 2, 'MarkerSize', 7);

    % Negative examples: black circles with a yellow face.
    plot(X(isNegative, 1), X(isNegative, 2), ...
         'ko', 'MarkerFaceColor', 'y', 'MarkerSize', 7);

    hold off;
end
注意:z 可以是矩阵或向量,所以要用逐元素运算(点除 ./、点乘方 .^),而不是矩阵运算。
function g = sigmoid(z)
%SIGMOID Compute the logistic sigmoid function element-wise.
%   g = SIGMOID(z) returns 1 ./ (1 + exp(-z)) for every element of z.
%   z may be a scalar, vector or matrix; g has the same size as z.

    % Use exp() rather than the constant `e`: `e` is predefined only in
    % Octave, so `e.^(-z)` raises an undefined-variable error in MATLAB.
    g = 1 ./ (1 + exp(-z));
end
注意 h 和 y 都是向量(矩阵),所以要用点除、点乘;还要求和——把所有样本的 cost 相加,算出总的 cost function。
别漏了 grad。
function [J, grad] = costFunction(theta, X, y)
%COSTFUNCTION Cost and gradient for (unregularized) logistic regression.
%   [J, grad] = COSTFUNCTION(theta, X, y) evaluates the logistic-regression
%   cost J for the parameter vector theta on the examples in X with labels
%   y, together with grad, the partial derivatives of J with respect to
%   each entry of theta. grad has the same dimensions as theta.

    numExamples = length(y);

    % Predicted probability for every example.
    hyp = sigmoid(X*theta);

    % Cross-entropy loss of each example, averaged over the training set.
    lossPerExample = -y.*log(hyp)-(1-y).*log(1-hyp);
    J = 1/numExamples*sum(lossPerExample);

    % Gradient: feature columns weighted by the prediction error.
    residual = hyp-y;
    grad = 1/numExamples*X'*residual;
end
别忘了 predict 输出的是 1 和 0(类别标签),而不是 sigmoid 算出的概率。
function p = predict(theta, X)
%PREDICT Classify examples as 0 or 1 with learned logistic-regression
%parameters theta.
%   p = PREDICT(theta, X) evaluates sigmoid(X*theta) for every row of X
%   and thresholds it at 0.5: entries >= 0.5 become 1, entries < 0.5
%   become 0. An entry that satisfies neither comparison (NaN) is left
%   unchanged.

    % Start from the raw probabilities so untouched entries pass through.
    p = sigmoid(X*theta);

    % Compute both masks before overwriting anything in p.
    isPositive = (p >= 0.5);
    isNegative = (p < 0.5);

    p(isPositive, 1) = 1;
    p(isNegative, 1) = 0;
end
在这里卡了特别久。要注意的是:正则化(regularize)的时候,J 和 grad 后面加的正则项都不包含 theta(1)(也就是 θ0)。
同时要注意函数的思想
一开始我用的是 theta(2:28,1)、X(:,2:28)、grad(2:28),运行 ex2_reg 的时候结果是正确的,但是 submit() 的时候出错了,提示索引超出了维度。原因在于 submit 会用另外一组数据来测试你的函数是否能实现功能并且具有通用性,因此要用 length() 来表示矩阵的维度,而不是直接手打数字进去——否则换一组数据,这个函数就不适用了。
非常感谢Andrew Ng帮我纠正这个坏习惯!~
function [J, grad] = costFunctionReg(theta, X, y, lambda)
%COSTFUNCTIONREG Cost and gradient for regularized logistic regression.
%   [J, grad] = COSTFUNCTIONREG(theta, X, y, lambda) evaluates the
%   logistic-regression cost J for parameters theta on examples X with
%   labels y, plus a squared penalty weighted by lambda, and grad, the
%   partial derivatives of J with respect to each entry of theta.
%   The first parameter, theta(1), is excluded from the penalty in both
%   J and grad. grad has the same dimensions as theta.

    numExamples = length(y);
    numParams = length(theta);

    % Predictions, their error, and the penalized part of theta.
    hyp = sigmoid(X*theta);
    residual = hyp-y;
    penalized = theta(2:numParams,1);

    % Average cross-entropy loss plus the penalty on theta(2:end).
    dataCost = 1/numExamples*sum((-y.*log(hyp)-(1-y).*log(1-hyp)));
    J = dataCost+lambda/(2*numExamples)*penalized'*penalized;

    % The first gradient entry carries no regularization term; the
    % remaining entries add lambda/m times the matching parameter.
    grad = zeros(size(theta));
    grad(1) = 1/numExamples*X(:,1)'*residual;
    grad(2:numParams) = 1/numExamples*X(:,2:numParams)'*residual+lambda/numExamples*penalized;
end