"""
Experiment 1: Utilisation Ramp (M/M/1)
-------------------------------------------------
Model a single-GP triage system using an M/M/1 queue.
Plot arrival rate (lambda) against utilisation (rho) and average waiting time (wq).

Assumptions:
- Poisson arrivals (inter-arrival times are random and memoryless)
- Exponential service times
- service rate (mu) averages 12 patients/hour
"""

import matplotlib.pyplot as plt
import numpy as np


def calculate_utilisation_and_wait(mu: float, lambdas: np.ndarray) -> tuple[np.ndarray, np.ndarray]:
    """
    Calculate utilisation (rho) and mean waiting time in queue (Wq) for an M/M/1 queue.

    Uses rho = lambda / mu and Wq = rho / (mu - lambda). The Wq formula only
    holds while lambda < mu; for lambda >= mu the queue is unstable and the
    waiting time is reported as +infinity instead of a negative or
    divide-by-zero value.

    Parameters:
    mu : float
        Service rate (patients per hour)
    lambdas : np.ndarray
        Array of arrival rates (patients per hour)

    Returns:
    tuple[np.ndarray, np.ndarray]
        Arrays of utilisation (rho) and waiting time (Wq) in minutes.
        Wq is np.inf wherever lambda >= mu.
    """
    lambdas = np.asarray(lambdas, dtype=float)
    rho = lambdas / mu

    # Only stable entries go through the division; unstable ones get a dummy
    # denominator so no warning is raised, and are then overwritten with inf.
    stable = lambdas < mu
    spare_capacity = np.where(stable, mu - lambdas, 1.0)
    wq_hours = np.where(stable, rho / spare_capacity, np.inf)

    wq_minutes = wq_hours * 60
    return rho, wq_minutes


def plot_utilisation_and_wait(lambdas: np.ndarray, rho: np.ndarray, wq: np.ndarray) -> None:
    """
    Draw utilisation and waiting time against arrival rate on twin y-axes.

    Parameters:
    lambdas : np.ndarray
        Arrival rates used as the shared x-axis (patients per hour)
    rho : np.ndarray
        Utilisation values, drawn against the left axis (limits fixed to 0..1)
    wq : np.ndarray
        Waiting times (minutes), drawn against the right axis
    """
    rho_colour = 'tab:blue'
    wq_colour = 'tab:red'

    fig, rho_axis = plt.subplots()

    # Left y-axis: utilisation
    rho_axis.plot(lambdas, rho, 'o-', color=rho_colour, label='Utilisation (ρ)')
    rho_axis.set_xlabel("Arrival rate λ (patients/hour)")
    rho_axis.set_ylabel("Utilisation factor ρ", color=rho_colour)
    rho_axis.tick_params(axis='y', labelcolor=rho_colour)
    rho_axis.set_ylim(0, 1)

    # Right y-axis: waiting time, sharing the x-axis with the utilisation curve
    wq_axis = rho_axis.twinx()
    wq_axis.plot(lambdas, wq, 's--', color=wq_colour, label='Waiting time Wq (minutes)')
    wq_axis.set_ylabel("Average waiting time Wq (minutes)", color=wq_colour)
    wq_axis.tick_params(axis='y', labelcolor=wq_colour)

    # Title and layout
    plt.title("GP Online Triage. M/M/1 Queue, service rate μ= 12/hr")
    fig.tight_layout()

    plt.show()


# --- Parameters ---
# Service rate of the single GP (patients/hour)
MU = 12.0
# Arrival rates swept from 4 to 11 patients/hour inclusive, held as floats
lambdas = np.arange(4, 12, dtype=float)


# --- Execution ---
# Utilisation and mean waiting time for every arrival rate in the sweep
rho, wq = calculate_utilisation_and_wait(MU, lambdas)

# Show both curves against the arrival rate
plot_utilisation_and_wait(lambdas, rho, wq)

"""
Experiment 2: Meeting service target (M/M/1)
-------------------------------------------------
Model a single-GP triage system using an M/M/1 queue.
Plot arrival rate (lambda) against service rate (mu) required
to ensure that 90% of triage requests are started within
30 minutes.

Assumptions:
- Target: 90% start within 30 minutes
- Poisson arrival and exponential service times
"""

import matplotlib.pyplot as plt
import numpy as np
import math
from scipy.special import lambertw

def calculate_required_mus(lambdas: np.ndarray, t: float = 0.5, target: float = 0.9) -> np.ndarray:
    """
    Solve for μ in the M/M/1 queue with the condition:
        P(wait ≤ t) = target
    where:
        target = 1 - (λ/μ) * exp(-(μ - λ)t)

    Rearranging gives (μt) * exp(μt) = (λt / (1 - target)) * exp(λt), so
    μ = W(arg) / t with W the principal branch of the Lambert W function.

    The computation is always carried out in floating point, so integer
    arrival-rate arrays (e.g. from np.arange) do not truncate the result.

    Parameters:
    lambdas : np.ndarray
        Array of arrival rates (patients per hour)
    t : float
        Target time (hours)
    target : float
        Target probability (e.g., 0.9 for 90%)

    Returns:
    np.ndarray
        Float array of required service rates (patients per hour),
        same shape as `lambdas`
    """
    arrival_rates = np.asarray(lambdas, dtype=float)
    p = 1 - target  # allowed probability of waiting longer than t

    # lambertw is vectorised; its result is complex, and only the real part
    # is kept, as in the per-element form of this calculation.
    arg = (arrival_rates * t / p) * np.exp(arrival_rates * t)
    return lambertw(arg).real / t


def plot_required_mus(required_mus: np.ndarray, lambdas: np.ndarray) -> None:
    """
    Plot the supplied per-arrival-rate values against arrival rates.

    The y-axis label and legend describe the plotted values as a mean
    service time in minutes.
    NOTE(review): the parameter is named `required_mus`, yet the labels
    describe minutes per patient - confirm callers pass service times
    (60 / μ) rather than rates.

    Parameters:
    required_mus: np.ndarray
        Array of values plotted on the y-axis (labelled as mean service
        time in minutes).
    lambdas : np.ndarray
        Array of arrival rates (patients per hour), plotted on the x-axis
    """
    _, axis = plt.subplots(figsize=(7, 5))
    axis.plot(lambdas, required_mus, marker='s', label='Mean service time allowed (min)')

    axis.set_title('Service rate required for 90% of triages to start within 30 minutes')
    axis.set_xlabel('Arrival rate λ (patients/hour)')
    axis.set_ylabel('Mean service time (minutes)')

    axis.legend()
    axis.grid(True)

    plt.show()

# --- Parameters ---
lambdas = np.arange(4, 12)  # arrival rates: 4 to 11 patients per hour
target = 0.9                # required share of requests started within T
T = 30 / 60                 # waiting-time threshold: 30 minutes, in hours


# --- Compute required μ values ---
mus = calculate_required_mus(lambdas, T, target)
# Convert each rate (patients/hour) into minutes available per patient
service_times = 60 / mus

plot_required_mus(service_times, lambdas)

"""
Experiment 3: Complete or signpost? (M/G/1)
-------------------------------------------------
Model a single-GP triage system using an M/G/1 queue.
Plot the maximum proportion of full completions (p)
that can be sustained for different arrival rates (λ),
while still meeting the service target that 90 % of
triage requests are started within 30 minutes.

Assumptions:
- Target: 90% start within 30 minutes
- Poisson arrival times
- Two-point service time distribution:
    - Complete, with probability p, mean time S1 = 10 minutes
    - Signpost, with probability (1-p), mean time S2 = 3 minutes
- Effective mean service time  E[S] = (7p + 3) minutes
    - Service rate  μ = 60 / (7p + 3) patients per hour
"""

import matplotlib.pyplot as plt
import math
import numpy as np
from scipy.special import lambertw


def calculate_mu_required(lam: float, t: float = 30 / 60, target: float = 0.9) -> float:
    """
    Return the service rate μ at which P(wait ≤ t) equals `target`.

    The value returned is μ = W(x) / t, where W is the principal Lambert W
    branch and x = (λt / (1 - target)) * exp(λt). This is the solution of
    (λ/μ) * exp(-(μ - λ)t) = 1 - target.
    NOTE(review): that tail expression is the exponential-service (M/M/1)
    form - confirm it is the intended approximation for this M/G/1
    experiment.

    Parameters:
    lam : float
        arrival rate (patients per hour)
    t : float
        Target time (hours)
    target : float
        Target probability (e.g., 0.9 for 90%)

    Returns:
    float
        required service rate (patients per hour)
    """
    tail_probability = 1 - target
    scaled_arrivals = lam * t
    lambert_argument = (scaled_arrivals / tail_probability) * math.exp(scaled_arrivals)

    # lambertw returns a complex value; only the real part is used
    solution = lambertw(lambert_argument)
    return solution.real / t


def pmax_from_mu(mus_required: np.ndarray) -> np.ndarray:
    """
    Convert required service rates into the largest sustainable
    completion proportion p.

    The mean service time allowed is 60 / μ minutes; p is then
    (60 / μ − 3) / 7, limited to the interval [0, 1].

    Parameters:
    mus_required : np.ndarray
        Array of required service rates (patients per hour)

    Returns:
    np.ndarray
        Array of maximum feasible completion proportions (p)
    """
    minutes_per_patient = 60 / mus_required
    unclipped_share = (minutes_per_patient - 3) / 7
    return np.clip(unclipped_share, 0, 1)


def plot_max_completion_share(pmax: np.ndarray, lambdas: np.ndarray) -> None:
    """
    Plot the maximum feasible completion share against arrival rate.

    Parameters:
    pmax: np.ndarray
        Array of the maximum feasible completion proportions (p),
        drawn on a y-axis fixed to 0..1.
    lambdas : np.ndarray
        Array of arrival rates (patients per hour)
    """
    _, axis = plt.subplots(figsize=(7, 5))
    axis.plot(lambdas, pmax, marker='o')

    axis.set_ylim(0, 1)
    axis.grid(True, alpha=.3)

    axis.set_xlabel('Arrival rate λ (per hour)')
    axis.set_ylabel('Max completion share p')
    axis.set_title('Max % of cases GP can complete while keeping 90% start ≤ 30 min')
    plt.show()
    

# --- Parameters ---
target = 0.9                 # required probability of starting within t (90%)
t = 30 / 60                  # waiting-time threshold in hours
lambdas = np.arange(4, 12)   # arrival rates 4-11 per hour


# --- Execution ---
# One required service rate per arrival rate, collected into a float array
mus_required = np.fromiter(
    (calculate_mu_required(lam, t, target) for lam in lambdas),
    dtype=float,
)
pmax = pmax_from_mu(mus_required)
plot_max_completion_share(pmax, lambdas)

"""
Experiment 4: Mean Waiting Time (M/G/1)
----------------------------------------

Model a single-GP triage system using an M/G/1 queue
with a two-point service-time distribution.

Objective:
Explore how the mean waiting time in the queue (Wq)
depends on the proportion of full completions (p)
and the arrival rate (λ).

Assumptions:
- Poisson arrivals (rate λ per hour)
- Service time distribution:
    • Complete: 10 minutes, probability p
    • Signpost: 3 minutes, probability (1-p)
- Mean service time  E[S] = (3 + 7p) minutes
- Mean squared service time  E[S²] = (9 + 91p) minutes²
- Pollaczek–Khinchine (M/G/1) waiting-time formula:
    described in MD cell above
"""

import numpy as np
import matplotlib.pyplot as plt


def mean_wait(lam: float, p: float) -> np.ndarray:
    """
    Calculate the M/G/1 mean waiting time in queue (minutes)
    for a two-point service-time distribution:
        S1 = 10 min with probability p
        S2 =  3 min with probability (1 - p)

    Uses the Pollaczek–Khinchine formula Wq = λ E[S²] / (2 (1 - ρ)) with
    ρ = λ E[S]. The formula is only valid for ρ < 1; where ρ ≥ 1 the queue
    is unstable and the result is np.inf (not a large finite number).

    Parameters
    ----------
    lam : float or np.ndarray
        Arrival rate λ (per hour)
    p : float or np.ndarray
        Proportion of full 10-minute completions (0 ≤ p ≤ 1)

    Returns
    -------
    np.ndarray
        Mean waiting time in queue Wq (minutes); np.inf where ρ ≥ 1
    """
    # Expected service time and second moment in minutes
    es_min = 3 + 7 * p         # E[S]   = 10p + 3(1 - p)
    es2_min = 9 + 91 * p       # E[S²]  = 100p + 9(1 - p)

    # Convert to hours and hours²
    es_h = es_min / 60
    es2_h = es2_min / 3600

    # Utilisation factor; left unclipped so the stability test is meaningful
    rho = lam * es_h
    stable = rho < 1

    # Unstable entries get a dummy denominator, so the division never sees
    # zero or a negative value; they are then replaced with inf.
    denominator = np.where(stable, 2 * (1 - rho), 1.0)
    wq_h = np.where(stable, lam * es2_h / denominator, np.inf)
    return 60 * wq_h  # convert from hours to minutes


def plot_mean_waiting_time(lambdas: np.ndarray, ps: np.ndarray) -> None:
    """
    Draw one curve of mean queue wait (Wq) versus completion proportion (p)
    per arrival rate (λ), with a dashed reference line at 30 minutes.

    Parameters
    ----------
    lambdas : np.ndarray
        Array of arrival rates (patients/hour); one curve is drawn for each
    ps : np.ndarray
        Array of completion proportions (0 ≤ p ≤ 1) used as the x-axis
    """
    fig, axis = plt.subplots(figsize=(7, 5))

    # One labelled line per arrival rate
    for lam in lambdas:
        axis.plot(ps, mean_wait(lam, ps), label=f"λ = {lam}/h")

    # Reference line at the 30-minute mark
    axis.axhline(30, ls="--", alpha=0.4, color="gray")

    axis.set_ylim(0, 180)
    axis.set_title("M/G/1 Mean Queue Wait vs Completion Share")
    axis.set_xlabel("Completion share p")
    axis.set_ylabel("Mean waiting time Wq (minutes)")
    axis.legend(ncol=2, fontsize=8)
    axis.grid(True, alpha=0.3)

    fig.tight_layout()
    plt.show()


# --- Parameters ---
ps = np.linspace(0, 1, num=51)            # 51 evenly spaced completion proportions in [0, 1]
lambdas = np.arange(start=5, stop=13)     # arrival rates 5..12 per hour


# --- Execution ---
# One waiting-time curve per arrival rate
plot_mean_waiting_time(lambdas, ps)

"""
Experiment 5: Effect of Adding Triaging GPs (M/M/s)
----------------------------------------------------

Model a triage system with multiple GPs (servers) working in parallel,
using the M/M/s queueing model.

Objective:
Quantify how adding additional triaging GPs (s) affects mean waiting time
in the queue (Wq), assuming each GP triages at the same average rate (μ).

Assumptions:
- Poisson arrivals (λ per hour)
- Exponential service times with mean rate μ = 12 patients/hour (~5 min per case)
- Servers work independently but share the same queue
- Number of triagers s ∈ {1, 2, 3}
- Erlang C formula for the probability of waiting:
    expressed in the MD cell above
- Mean waiting time in queue:
    formula expressed in the MD cell above
"""

import math
import numpy as np
import matplotlib.pyplot as plt


def erlang_c(lam: float, mu: float, s: int) -> float:
    """
    Return the Erlang C probability (Pw) for an M/M/s queue,
    i.e. the probability that an arriving patient has to wait.

    Parameters
    ----------
    lam : float
        Arrival rate (patients/hour)
    mu : float
        Service rate per server (patients/hour)
    s : int
        Number of servers (triaging GPs)

    Returns
    -------
    float
        Probability that an arrival must wait (Erlang C);
        1.0 when utilisation lam / (s * mu) is at or above 1
    """
    utilisation = lam / (s * mu)
    if utilisation >= 1:
        # Unstable system: report certain waiting (100% utilisation)
        return 1.0

    offered_load = lam / mu

    # Term for "all s servers busy"
    waiting_term = offered_load ** s / (math.factorial(s) * (1 - utilisation))

    # Terms for 0 .. s-1 busy servers
    partial_sum = 0
    for n in range(s):
        partial_sum += offered_load ** n / math.factorial(n)

    return waiting_term / (partial_sum + waiting_term)


def mean_wait_mm_s(lam: float, mu: float, s: int) -> float:
    """
    Return the mean waiting time in queue (Wq, hours) for an M/M/s queue,
    computed as the Erlang C probability divided by the spare capacity
    (s * mu - lam).

    Parameters
    ----------
    lam : float
        Arrival rate (patients/hour)
    mu : float
        Service rate per server (patients/hour)
    s : int
        Number of servers

    Returns
    -------
    float
        Mean waiting time in queue (hours); np.inf when
        lam / (s * mu) is at or above 1
    """
    total_capacity = s * mu
    if lam / total_capacity >= 1:
        # Unstable system: the queue grows without bound
        return np.inf

    prob_wait = erlang_c(lam, mu, s)
    return prob_wait / (total_capacity - lam)


def plot_mm_s_waiting_times(mu: float, lambdas: np.ndarray, servers: list[int]) -> None:
    """
    Draw mean queue wait (minutes) against arrival rate (λ), one curve
    per number of triaging GPs (s).

    Parameters
    ----------
    mu : float
        Service rate per GP (patients/hour)
    lambdas : np.ndarray
        Array of arrival rates (patients/hour)
    servers : list[int]
        Server counts to plot; each entry produces one curve
    """
    fig, axis = plt.subplots(figsize=(8, 5))

    for s in servers:
        # mean_wait_mm_s works in hours; scale each value to minutes
        wait_minutes = np.array([60 * mean_wait_mm_s(lam, mu, s) for lam in lambdas])
        axis.plot(lambdas, wait_minutes, marker="o", label=f"{s} triager{'s' if s > 1 else ''}")

    axis.set_title("Experiment 5 — Effect of Adding Triaging GPs (M/M/s)")
    axis.set_xlabel("Arrival rate λ (patients/hour)")
    axis.set_ylabel("Mean queue wait $W_q$ (minutes)")
    axis.set_ylim(0, 120)
    axis.legend()
    axis.grid(alpha=0.3)

    fig.tight_layout()
    plt.show()


# --- Parameters ---
servers = [1, 2, 3]                      # numbers of triagers to compare
lambdas = np.arange(start=4, stop=41)    # arrival rates 4..40 per hour
mu = 12.0                                # per-GP service rate: 12 patients/hour (5 min each)


# --- Execution ---
# One waiting-time curve per server count
plot_mm_s_waiting_times(mu, lambdas, servers)

"""
Experiment 6: Minimum Staffing to Meet SLA (M/M/s)
----------------------------------------------------

Model a triage system with multiple GPs (servers) using an M/M/s queue.

Objective:
Determine the minimum number of triaging GPs (s) required to meet a
specific Service Level Agreement (SLA), e.g. 90% of triage requests
must start within 30 minutes.

Assumptions:
- Poisson arrivals (λ per hour)
- Exponential service times with mean rate μ = 12 patients/hour (= 5 min per case)
- Shared single queue served by s identical triagers
- SLA target: 90% of patients begin triage within 30 minutes
- Erlang C probability of waiting:
    formula expressed in the MD cell above
- Probability that a patient starts triage within time t:
    formula expressed in the MD cell above
"""

import math
import numpy as np
import matplotlib.pyplot as plt


def erlang_c(lam: float, mu: float, s: int) -> float:
    """
    Return the Erlang C probability (Pw) that an arrival must wait
    in an M/M/s queue.

    Parameters
    ----------
    lam : float
        Arrival rate (patients/hour)
    mu : float
        Service rate per server (patients/hour)
    s : int
        Number of servers (triaging GPs)

    Returns
    -------
    float
        Probability that an arrival must wait; 1.0 when
        lam / (s * mu) is at or above 1
    """
    rho = lam / (s * mu)
    if rho >= 1:
        # Unstable system: treat as 100% utilisation, every arrival waits
        return 1.0

    load = lam / mu

    # Contributions from states with fewer than s busy servers
    below_capacity = [(load**n) / math.factorial(n) for n in range(s)]
    # Contribution from states with all s servers busy
    at_capacity = (load**s) / (math.factorial(s) * (1 - rho))

    return at_capacity / (sum(below_capacity) + at_capacity)


def p_wait_leq_t(lam: float, mu: float, s: int, t_hours: float) -> float:
    """
    Return the probability that a patient waits no longer than t_hours
    in an M/M/s queue, computed as 1 - Pw * exp(-(s*mu - lam) * t_hours)
    with Pw the Erlang C probability.

    Parameters
    ----------
    lam : float
        Arrival rate (patients/hour)
    mu : float
        Service rate per server (patients/hour)
    s : int
        Number of servers
    t_hours : float
        Target wait threshold (hours)

    Returns
    -------
    float
        Probability that waiting time ≤ t_hours; 0.0 when lam >= s * mu
    """
    total_capacity = s * mu
    if lam >= total_capacity:
        # Unstable system: report probability 0
        return 0.0

    spare_rate = total_capacity - lam
    prob_exceeds = erlang_c(lam, mu, s) * math.exp(-spare_rate * t_hours)
    return 1.0 - prob_exceeds


def min_servers_for_sla(lam: float, mu: float, t_hours: float, target: float = 0.9, s_max: int = 20) -> float:
    """
    Find the smallest number of servers (s) in 1..s_max for which the
    system is stable (lam < s * mu) and P(Wq ≤ t_hours) ≥ target.

    Parameters
    ----------
    lam : float
        Arrival rate (patients/hour)
    mu : float
        Service rate per server (patients/hour)
    t_hours : float
        SLA threshold time (hours)
    target : float, default = 0.9
        Target probability (e.g. 0.9 for 90%)
    s_max : int, default = 20
        Maximum number of servers to test

    Returns
    -------
    float
        Minimum s meeting SLA (returned as the int loop value),
        or NaN if no s up to s_max qualifies
    """
    candidates = range(1, s_max + 1)
    # Server counts are tried in ascending order, so the first hit is the minimum.
    # The stability check comes first and short-circuits the SLA evaluation.
    return next(
        (
            s
            for s in candidates
            if lam < s * mu and p_wait_leq_t(lam, mu, s, t_hours) >= target
        ),
        np.nan,
    )


def plot_min_servers_for_sla(
    lambdas: np.ndarray,
    mu: float,
    t_hours: float,
    target: float,
) -> None:
    """
    Draw a step plot of the minimum number of triagers (s) needed to
    meet the SLA at each arrival rate.

    Parameters
    ----------
    lambdas : np.ndarray
        Array of arrival rates (patients/hour)
    mu : float
        Service rate per server (patients/hour)
    t_hours : float
        SLA threshold (hours)
    target : float
        SLA target probability (e.g. 0.9)
    """
    staffing = [min_servers_for_sla(lam, mu, t_hours, target) for lam in lambdas]

    fig, axis = plt.subplots(figsize=(8, 5))
    axis.step(lambdas, staffing, where="post", color="tab:orange", label=f"{int(target*100)}% ≤ {int(t_hours*60)} min")

    axis.set_title("Experiment 6 — Minimum Triagers Required to Meet SLA (M/M/s)")
    axis.set_xlabel("Arrival rate λ (patients/hour)")
    axis.set_ylabel("Minimum triagers (s)")
    axis.grid(alpha=0.3)
    axis.legend()

    # Integer ticks from 1 up to the largest staffing level found (NaN entries ignored)
    highest = int(np.nanmax(staffing))
    axis.set_yticks(range(1, highest + 1))

    fig.tight_layout()
    plt.show()


# --- Parameters ---
t_30 = 30 / 60                          # SLA threshold: 30 minutes, in hours
lambdas = np.arange(start=4, stop=41)   # arrival rates 4..40 per hour
target = 0.90                           # SLA: 90% of patients start within t_30
mu = 12.0                               # per-triager service rate (patients/hour)


# --- Execution ---
# Minimum staffing level for each arrival rate, shown as a step plot
plot_min_servers_for_sla(lambdas, mu, t_30, target)

# Application of Healthcare Queueing Models to Online Triage Systems in Primary Care

# Introduction: Queueing in Healthcare

# Triage in Primary Care

# Study Design

# Model 1: GP Same‑day Triage (M/M/1)

# Experiment 1: Utilisation ramp

# Experiment 1: Results

# Experiment 2 — Meeting service target

# Experiment 2: results

# Model 2: Completing versus signposting (M/G/1)

# Experiment 3 - Complete or signpost? (M/G/1)

# Experiment 3: Results

# Experiment 4 - Mean waiting time (M/G/1)

# Experiment 4: Results

# Model 3: multiple triaging GPs (M/M/s)

# Experiment 5 — Effect of adding more triaging GPs (M/M/s)

# Experiment 5: Results

# Experiment 6: Capacity planning (M/M/s)

# Experiment 6: Results

# Summary and Conclusion

# Limitations

# Future work

# Generative AI usage

# References