1%% Example: Using setReward
for reward-based CTMC analysis
2% This example demonstrates the setReward feature
for defining custom
3% reward functions on a queueing network model and computing steady-state
4% expected rewards
using the CTMC solver.
6% Copyright (c) 2012-2026, Imperial College London
12% Create a simple M/M/1/K queue with finite buffer
14model = Network(
'RewardExample');
17source = Source(model,
'Source');
18queue = Queue(model,
'Queue', SchedStrategy.FCFS);
19sink = Sink(model,
'Sink');
21% Set finite buffer capacity
22queue.setNumberOfServers(1);
23queue.setCapacity(3); % Maximum jobs in the system
26oclass = OpenClass(model,
'Class1');
27source.setArrival(oclass, Exp(2)); % Arrival rate = 2
28queue.setService(oclass, Exp(3)); % Service rate = 3 (utilization ~ 0.67)
31model.link(Network.serialRouting(source,queue,sink));
33%% Define Reward Functions
34% setReward(name, @(state, sn) -> reward_value)
35% The function receives the aggregated state vector and network structure
37% Reward 1: Queue length (number of jobs in the queue)
38% State format
for this model: state = [jobs_at_queue]
39model.setReward(
'QueueLength', @(state, sn) state(2));
41% Reward 2: Utilization (1
if server busy, 0
if idle)
42% Server
is busy
if at least 1 job
is present
43model.setReward(
'Utilization', @(state, sn) min(state(2), 1));
45% Reward 3: Blocking indicator (1
if buffer full, 0 otherwise)
46% Buffer
is full when jobs = capacity (10)
47model.setReward('BlockingProb', @(state, sn) (state(2) >= 10));
49% Reward 4: Weighted queue cost (quadratic penalty for
long queues)
50model.setReward('QueueCost', @(state, sn) state(2)^2);
52%% Solve with CTMC Solver
53fprintf('Solving with CTMC solver...\n\n');
55options = Solver.defaultOptions;
58solver = CTMC(model, options);
60%% Get Steady-State Expected Rewards
61[R, names] = solver.getAvgReward();
63fprintf('\n=== Steady-State Expected Rewards ===\n');
64for i = 1:length(names)
65 fprintf('%15s: %.6f\n', names{i}, R(i));
68%% Get Transient Reward Analysis
69% Get full reward trajectories over time
70[t, V, names, stateSpace] = solver.getReward();
72fprintf(
'\n=== State Space ===\n');
73fprintf(
'Number of states: %d\n', size(stateSpace, 1));
74fprintf(
'State dimensions: %d\n', size(stateSpace, 2));
76%% Plot Reward Convergence
77figure(
'Name',
'Reward Convergence',
'Position', [100 100 800 600]);
79nRewards = length(names);
83 % Plot mean reward rate over time (averaged over all initial states)
84 meanReward = mean(V{r}, 2); % Average over states
86 % Compute reward rate (reward per unit time)
87 rewardRate = zeros(length(t), 1);
89 rewardRate(k) = meanReward(k) / t(k);
92 plot(t(2:end), rewardRate(2:end),
'LineWidth', 1.5);
94 yline(R(r),
'r--',
'LineWidth', 1.5);
98 ylabel(
'Expected Reward Rate');
99 title(sprintf(
'%s (Steady-state: %.4f)', names{r}, R(r)));
100 legend(
'Transient',
'Steady-state',
'Location',
'best');
104sgtitle(
'Convergence of Reward Functions to Steady-State');
106%% Compare with Analytical Results
for M/M/1/K
107fprintf(
'\n=== Comparison with M/M/1/K Analytical Results ===\n');
109lambda = 2; % Arrival rate
110mu = 3; % Service rate
112K = 10; % Buffer capacity
114% For M/M/1/K queue, steady-state probabilities:
115% pi(n) = (1-rho) * rho^n / (1 - rho^(K+1))
119 pi(n+1) = (1 - rho) * rho^n / (1 - rho^(K+1));
122 pi = ones(K+1, 1) / (K+1);
125% Analytical expected queue length
126L_analytical = sum((0:K)
' .* pi);
128% Analytical utilization (P(server busy) = 1 - pi(0))
129U_analytical = 1 - pi(1);
131% Analytical blocking probability = pi(K)
132B_analytical = pi(end);
134% Analytical queue cost (E[N^2])
135Cost_analytical = sum(((0:K).^2)' .* pi);
137fprintf(
'%15s: LINE = %.6f, Analytical = %.6f, Error = %.2e\n', ...
138 'QueueLength', R(1), L_analytical, abs(R(1) - L_analytical));
139fprintf(
'%15s: LINE = %.6f, Analytical = %.6f, Error = %.2e\n', ...
140 'Utilization', R(2), U_analytical, abs(R(2) - U_analytical));
141fprintf(
'%15s: LINE = %.6f, Analytical = %.6f, Error = %.2e\n', ...
142 'BlockingProb', R(3), B_analytical, abs(R(3) - B_analytical));
143fprintf(
'%15s: LINE = %.6f, Analytical = %.6f, Error = %.2e\n', ...
144 'QueueCost', R(4), Cost_analytical, abs(R(4) - Cost_analytical));
146fprintf(
'\nExample completed successfully.\n');