Finished first part of task 1

2016-10-19 09:33:01 +01:00
commit b9486fc422
15 changed files with 422 additions and 0 deletions
@@ -0,0 +1,9 @@
 function hypothesis = calculate_hypothesis(X, theta, training_example)
    %CALCULATE_HYPOTHESIS This calculates the hypothesis for a given X,
    %theta and specified training example
    x0 = X(training_example, 1);
    x1 = X(training_example, 2);
    hypothesis = theta(1)*x0+theta(2)*x1;
 end
@@ -0,0 +1,17 @@
 function J = compute_cost(X, y, theta)
    %COMPUTE_COST Compute cost for linear regression. Takes as input
    %matrix X of training examples, a parameter vector, theta, and an
    %output vector y
    J = 0.0; %cost
    m = size(y, 1); %number of training examples
    for i = 1:m
        hypothesis = calculate_hypothesis(X, theta, i);
        output = y(i);
        squared_error = (hypothesis - output) ^ 2;
        J = J + squared_error;
    end
    J = J * (1.0 / (2 * m));
 end
@@ -0,0 +1,25 @@
 function J = compute_cost_regularised(X, y, theta, l)
    %COMPUTE_COST_REGULARISED Compute cost for regularised linear regression.
    %Takes as input matrix X of training examples, a parameter vector, theta, 
    %lambda (l) and an output vector y
    total_squared_error = 0.0; %cost
    m = size(y, 1); %number of training examples
    for i = 1:m
        hypothesis = calculate_hypothesis(X, theta, i);
        output = y(i);
        squared_error = (hypothesis - output) ^ 2;
        total_squared_error = total_squared_error + squared_error;
    end
    total_regularised_error = 0.0;
    for i = 2:length(theta)
        total_regularised_error = total_regularised_error + theta(i) ^ 2;
    end
    total_regularised_error = total_regularised_error * l;
    J = (1.0 / (2 * m)) * (total_squared_error + total_regularised_error);
 end
@@ -0,0 +1,97 @@
 6.1101,17.592
 5.5277,9.1302
 8.5186,13.662
 7.0032,11.854
 5.8598,6.8233
 8.3829,11.886
 7.4764,4.3483
 8.5781,12
 6.4862,6.5987
 5.0546,3.8166
 5.7107,3.2522
 14.164,15.505
 5.734,3.1551
 8.4084,7.2258
 5.6407,0.71618
 5.3794,3.5129
 6.3654,5.3048
 5.1301,0.56077
 6.4296,3.6518
 7.0708,5.3893
 6.1891,3.1386
 20.27,21.767
 5.4901,4.263
 6.3261,5.1875
 5.5649,3.0825
 18.945,22.638
 12.828,13.501
 10.957,7.0467
 13.176,14.692
 22.203,24.147
 5.2524,-1.22
 6.5894,5.9966
 9.2482,12.134
 5.8918,1.8495
 8.2111,6.5426
 7.9334,4.5623
 8.0959,4.1164
 5.6063,3.3928
 12.836,10.117
 6.3534,5.4974
 5.4069,0.55657
 6.8825,3.9115
 11.708,5.3854
 5.7737,2.4406
 7.8247,6.7318
 7.0931,1.0463
 5.0702,5.1337
 5.8014,1.844
 11.7,8.0043
 5.5416,1.0179
 7.5402,6.7504
 5.3077,1.8396
 7.4239,4.2885
 7.6031,4.9981
 6.3328,1.4233
 6.3589,-1.4211
 6.2742,2.4756
 5.6397,4.6042
 9.3102,3.9624
 9.4536,5.4141
 8.8254,5.1694
 5.1793,-0.74279
 21.279,17.929
 14.908,12.054
 18.959,17.054
 7.2182,4.8852
 8.2951,5.7442
 10.236,7.7754
 5.4994,1.0173
 20.341,20.992
 10.136,6.6799
 7.3345,4.0259
 6.0062,1.2784
 7.2259,3.3411
 5.0269,-2.6807
 6.5479,0.29678
 7.5386,3.8845
 5.0365,5.7014
 10.274,6.7526
 5.1077,2.0576
 5.7292,0.47953
 5.1884,0.20421
 6.3557,0.67861
 9.7687,7.5435
 6.5159,5.3436
 8.5172,4.2415
 9.1802,6.7981
 6.002,0.92695
 5.5204,0.152
 5.0594,2.8214
 5.7077,1.8451
 7.6366,4.2959
 5.8707,7.2029
 5.3054,1.9869
 8.2934,0.14454
 13.394,9.0551
 5.4369,0.61705
@@ -0,0 +1,47 @@
 2104,3,399900
 1600,3,329900
 2400,3,369000
 1416,2,232000
 3000,4,539900
 1985,4,299900
 1534,3,314900
 1427,3,198999
 1380,3,212000
 1494,3,242500
 1940,4,239999
 2000,3,347000
 1890,3,329999
 4478,5,699900
 1268,3,259900
 2300,4,449900
 1320,2,299900
 1236,3,199900
 2609,4,499998
 3031,4,599000
 1767,3,252900
 1888,2,255000
 1604,3,242900
 1962,4,259900
 3890,3,573900
 1100,3,249900
 1458,3,464500
 2526,3,469000
 2200,3,475000
 2637,3,299900
 1839,2,349900
 1000,1,169900
 2040,4,314900
 3137,3,579900
 1811,4,285900
 1437,3,249900
 1239,3,229900
 2132,4,345000
 4215,4,549000
 2162,4,287000
 1664,2,368500
 2238,3,329900
 2567,4,314000
 1200,3,299000
 852,2,179900
 1852,4,299900
 1203,3,239500
@@ -0,0 +1,71 @@
 function theta = gradient_descent(X, y, theta, alpha, iterations, do_plot)
    %GRADIENT_DESCENT do Gradient Descent for a given X, y, theta, alpha
    %for a specified number of iterations
    %if less than 6 arguments was given, then set do_plot to be false
    if nargin < 6
        do_plot = false;
    end
    if(do_plot)
        plot_hypothesis(X, y, theta);
        drawnow; pause(0.1); 
    end
    m = size(X, 1); %number of training examples
    cost_vector = []; %will store the results of our cost function
    for it = 1:iterations
        %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
        % gradient descent
        %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
        theta_0 = theta(1);
        theta_1 = theta(2);
        %update theta(1) and store in temporary variable theta_0
        sigma = 0.0;
        for i = 1:m
            hypothesis = X(i, 1) * theta(1) + X(i, 2) * theta(2);
            output = y(i);
            sigma = sigma + (hypothesis - output);
        end
        theta_0 = theta_0 - ((alpha * 1.0) / m) * sigma;
        %update theta(2) and store in temporary variable theta_1
        sigma = 0.0;
        for i = 1:m
            hypothesis = X(i, 1) * theta(1) + X(i, 2) * theta(2);
            output = y(i);
            sigma = sigma + (hypothesis - output) * X(i, 2);
        end
        theta_1 = theta_1 - ((alpha * 1.0) / m) * sigma;
        %update theta
        theta = [theta_0, theta_1];
        %update cost_vector
        cost_vector = [cost_vector; compute_cost(X, y, theta)];
        if do_plot
            plot_hypothesis(X, y, theta);
            drawnow; pause(0.1); 
        end
    end
    disp 'Gradient descent is finished.'
    if do_plot
        disp 'Press enter!'
        pause;
    end
    plot_cost(cost_vector);
    disp 'Press enter!';
    pause;
 end
@@ -0,0 +1,7 @@
 function hypothesis_vec = hypothesis_to_vector(X, theta)
    hypothesis_vec = [];
    for i = 1:size(X, 1)
        hypothesis_vec = [hypothesis_vec; calculate_hypothesis(X, theta, i)];
    end
 end
@@ -0,0 +1,14 @@
 function [X, y] = load_data_ex1()
 %loads the data for excercise 1
    %read our data from a text file
    data = dlmread('ex1data1.txt');
    %load from the first column into X
    X = data(:, 1);
    %load from the second column into y
    y = data(:, 2);
    %add 1 to the input vector
    X = [ones(size(X, 1), 1), X];
 end
@@ -0,0 +1,11 @@
 function [X, y] = load_data_ex2()
 %loads the data for excercise 2
    %read our data from a text file
    data = dlmread('ex1data2.txt');
    %load from the first two columns into X
    X = data(:, 1:2);
    %load from the third column into y
    y = data(:, 3);
 end
@@ -0,0 +1,14 @@
 %% This loads our data
 [X, y] = load_data_ex1();
 %% initialize
 theta = [0.0, 0.0]; %The weights of our model.
 alpha = 0.01; %The step size for gradient descent.
 iterations = 50;
 %do plotting
 do_plot = true;
 %% run gradient descent
 t = gradient_descent(X, y, theta, alpha, iterations, do_plot);
@@ -0,0 +1,18 @@
 %% This loads our data
 [X, y] = load_data_ex2();
 %% Normalise and initialize.
 [X, mean_vec, std_vec] = normalise_features(X);
 %after normalising we add the bias
 X = [ones(size(X, 1), 1), X];
 %initialise theta
 theta = [0.0, 0.0, 0.0];
 alpha = 0.1;
 iterations = 100;
 %% 
 t = gradient_descent(X, y, theta, alpha, iterations);
 disp 'Press enter to exit!';
 pause;
@@ -0,0 +1,60 @@
 function mllab3()
    % load input data
    X = [-0.99768; -0.69574; -0.40373; -0.10236; 0.22024;  0.47742;  0.82229];
    % load output data
    y = [2.0885; 1.1646; 0.3287; 0.46013; 0.44808; 0.10013; -0.32952];
    % insert the bias into the input data
    X = [ones(size(X, 1), 1), X];
    % perform a polynomial expansion to the fifth order
    for j = 2:5
        X = [X, X(:, 2) .^ j];
    end
    % initialise theta
    theta = [1.0, 1.0, 1.0, 1.0, 1.0];
    alpha = 0.01;
    l = 0.0;
    iterations = 1000;
    do_plot = false;
    % run gradient descent
    % you will need to modify the gradient_descent function to accept an
    % additional argument lambda (l).
    theta = gradient_descent(X, y, theta, alpha, iterations, l, do_plot)
    % plot the original data
    original_x = [-0.99768; -0.69574; -0.40373; -0.10236; 0.22024;  0.47742;  0.82229];
    figure(1);
    plot(original_x, y, 'x');
    hold on;
    x = linspace(-1, 1, 1000);
    y = [];
    for index = 1:1000
        y = [y, get_hypothesis(x(index), theta)];
    end
    plot(x, y,'-');
    disp 'Press enter to exit.';
    pause;
    close(1);
 end
 function hypothesis = get_hypothesis(x, theta)
 % helper function which we will use to calculate the
 % hypothesis for a given x and theta
    hypothesis = 0.0;
    for t = 1:length(theta)
        hypothesis = hypothesis + theta(t) * (x ^ (t - 1));
    end
 end
@@ -0,0 +1,14 @@
 function [N, mean_vector, std_vector] = normalise_features(X)
    %NORMALISE_FEATURES Normalise our features by subtracting the mean and
    %dividing by the standard deviation
    num_rows = size(X, 1);
    mean_vector = mean(X);
    std_vector = std(X);
    %subtract column mean
    N = X - ones(num_rows, 1) * mean_vector;
    %divide each element by column standard deviation
    N = N ./ (ones(num_rows, 1) * std_vector);
 end
@@ -0,0 +1,8 @@
 function plot_cost(J)
    figure(2);
    plot(J);
    xlabel('itarations');
    ylabel('cost');
 end
@@ -0,0 +1,10 @@
 function plot_hypothesis(X, y, theta)
    figure(1);
    clf(1);
    plot(X(:, 2), y, 'rx');
    hold on;
    plot(X(:, 2), hypothesis_to_vector(X, theta));
    xlabel('x'); ylabel('y=f(x)');
 end