format compact


nums = rand(10000,1);
%============
tic
total = zeros(10000,1);
for t=1:1000
    for i=1:10000
        total(i) = sin(nums(i));
    end
end
toc
%============
tic
for t=1:1000
    total = sin(nums);
end
toc


nums = rand(10000,1);
%============
tic
total = zeros(10000,1);
for t=1:1000
    for i=1:10000
        sin(nums(i));
    end
end
toc
%============
tic
for t=1:1000
    sin(nums);
end
toc


%%file test.m

function out = test(a,b)
    out = a + b;
end


%%file dummy.m

function out = dummy(in)
end


nums = randi(100,10000,1); % Creates a 10000x1 matrix with  random integers values 1 to 100 inclusive

% Original task:
tic
for t=1:10000
    total = 0;
    for i=1:10000
        total = total + nums(i);
    end
end
toc

% Function call overhead:
tic
for t=1:10000
    total = 0;
    for i=1:10000
        total = total + nums(i);
        dummy(42)
    end
end
toc

% Original task encapsulated in function to prevent JITing:
tic
for t=1:10000
    total = 0;
    for i=1:10000
        total = test(total, nums(i));
    end
end
toc

% Optimized built-ins are even better and should be used when possible:
tic
for t=1:10000
    total = sum(nums);
end
toc


nums = randi(100,10,1)


total = 0;
for i=1:numel(nums)
    total = total + nums(i);
end
total


%%file csum.m

% Calculate a cumulative sum from a to b
% Does same amount of work as we would for a "real" csum
function total = csum(a,b)
    total = 0;
    for i=a:b
        total = total + i;
    end
end


%%file csum2.m

% Calculate a cumulative sum from a to b
function total = csum2(a,b)
    total = zeros(numel(a:b),1);
    for i=a:b
        total(i) = total(i-1) + i;
    end
end


% Get all the cumulative sums from 1, for the numbers 1 to 100
tic
for i=1:(1*43000)
    myresults(i) = csum(1,i);
end
toc


logspace(1,5,13)


% Look at the running time as we increase the range of numbers we get the cumsum for
c = 1;
for N=logspace(1,5,13)
    tic
    for i=1:N
        myresults(i) = csum(1,i);
    end
    timings(c) = toc;
    c = c+1;
end
plot(logspace(1,5,13),timings,'o-')
xlabel("N")
ylabel("Runtime (s)")


% Remember "log rules":
log(2^8)
8*log(2)


% log-log plot of above, with linear regression in asymptotic region
loglog(logspace(1,5,13),timings,'o-')
xlabel("N")
ylabel("Runtime (s)")
polyfit(log(logspace(3,5,7)),log(timings(7:end)),1)


mysize=4300000;


clear myresults
tic
myresults(1)=1;
for i=2:mysize
    myresults(i) = myresults(i-1)+i;
end
toc
clear myresults


clear myresults
tic
myresults = zeros(mysize,1);
for i=2:mysize
    myresults(i) = myresults(i-1)+i;
end
toc
clear myresults


c = 1;
xx = logspace(1,7,13);
for N=xx
    tic
    myresults(1)=1;
    for i=2:N
        myresults(i) = myresults(i-1)+i;
    end
    timings(c) = toc;
    c = c+1;
end
loglog(xx,timings)
polyfit(log(xx(end-5:end)),log(timings(end-5:end)),1)


% If time permits...


nums=randi(100,10,1)


% What if we want to calculate a cumulative sum every time an entry changes?
total = zeros(10,1);
total(1)=nums(1);
for i=2:numel(nums)
    total(i) = total(i-1) + nums(i);
end
before=total


nums(randi(numel(nums)))=99


total(1)=nums(1);
for i=2:numel(nums)
    total(i) = total(i-1) + nums(i);
end
after=total


after-before


% How can we modify this to take advantage of our *a priori* knowledge?
total = zeros(10,1);
total(1)=nums(1);
for i=2:numel(nums)
    total(i) = total(i-1) + nums(i);
end
before=total


%%file myfib.m

function f = myfib(n)
    if n < 2
        f = n;
        return
    else
        f = myfib(n-1) + myfib(n-2);
    end
end


tic
myfib(10)
toc


timer = zeros(40,1);
for i=1:40
    tic
    myfib(i);
    timer(i) = toc;
    if i>30
        i
    end
end


loglog(timer(10:end))


nums=randi(100,10,1)


N = numel(nums);
total = nums;
for i=2:N
    total(i) = total(i-1) + nums(i);
end
total


myboxes = [9, 11, 7, 20, 1, 19];
items = [1, 3, 4, 10, 19];
max_weight = 20;

res = zeros(numel(myboxes),numel(items));
c = 1;
for i=myboxes
    res(c,:)=(i + items);
    c=c+1;
end
res
res<=max_weight


repmat(myboxes',1,numel(items))+repmat(items,numel(myboxes),1)


bsxfun(@plus,myboxes',items)


cool


A=toeplitz([[1 1] zeros(1,5-2)])


cool
A*cool*A


tic
for t=1:100000
    total = 0;
    for i=1:10000
        total = total + i;
    end
end
toc

tic
for t=1:100000
    total = sum(1:10000);
end
toc


total

What is "performance optimization"?¶

Memory access efficiency¶

Vectorization¶

a priori knowledge¶

Language strengths/weaknesses¶

Algorithmic improvements¶

Advanced Vectorization Methods¶

Instrumentation/metrics¶

Recommended algorithms starting places:¶