Contents
- Gale-Shapley
- Big-O Notation
- Data Structures
- Greedy Algorithms
- Solving Recurrence Relations
- Divide and Conquer Algorithms
- Dynamic Programming
Gale-Shapley (Stable Matching)
The Gale-Shapley algorithm produces a stable matching between $A=\{a_1,\cdots,a_n\}$ and $B=\{b_1,\cdots,b_n\}$, where each $a_i$ orders $B$ and each $b_j$ orders $A$ (preferences). The matching is represented by a 1-to-1 permutation function $\pi:\{1,\cdots,n\}\rightarrow\{1,\cdots,n\}$.
Pseudocode.
initialise $\pi(i)=0$ for all $i$
while $\exists i$ such that $\pi(i)=0$ do
choose $i$
$b_j\leftarrow$ most preferred pairing for $a_i$ that has not yet rejected $a_i$
if $b_j$ unmatched then
$\pi(i)=j$ match $a_i$ and $b_j$
else if $b_j$ matched with $a_{i'}$ but prefers $a_i$ to $a_{i'}$ then
unmatch $b_j$ and $a_{i'}$
$\pi(i)=j$ match $a_i$ and $b_j$
else keep current matching $\pi$, $b_j$ rejects $a_i$
Proofs.
- The algorithm terminates. Each iteration of the loop pairs an $a_i$ with a $b_j$ that has not yet rejected it. There are at most $n^2$ such pairings because there are $n$ $a$'s and $n$ $b$'s. As such, the loop must terminate after at most $n^2$ iterations, once all possible pairings have been visited.
- The result is a matching. Suppose on the contrary that there is some $a_{i'}$ that is unmatched at the end. Since there are $n-1$ other $a_i$'s to be matched to $n$ $b_j$'s, there must also be some $b_{j'}$ that is unmatched. This means that $b_{j'}$ must never have been paired at all, because once any $b_j$ is paired, it can only trade its existing match for one it prefers more; it can never become unmatched. However, this is a contradiction because $a_{i'}$ must have been paired with every $b_j$ (and rejected) before ending up unmatched.
- The matching is stable. Assume the matching is not stable. Then there exist some $a_i,b_j$ that are ultimately not matched together such that $a_i$ prefers $b_j$ to $b_{\pi(i)}$ and $b_j$ prefers $a_i$ to $a_{\pi^{-1}(j)}$. However, this cannot be the case: $a_i$ must have been paired with $b_j$ at some point, because it prefers $b_j$ to its final match. Either $b_j$ accepted $a_i$ and later unmatched, or $b_j$ rejected $a_i$ outright. In the first case, we have a contradiction because $b_j$ would not unmatch from $a_i$ to match with a less-preferred $a_{\pi^{-1}(j)}$. Similarly, $b_j$ would not have rejected $a_i$ outright, because it prefers $a_i$ to its final match.
- Def. $b_j$ is available to $a_i$ if $b_j$ did not reject $a_i$ and if either $b_j$ is unmatched or $b_j$ prefers $a_i$ to its current match.
Other information.
- The order of execution of the algorithm (choices of $i$) does not affect the matches produced.
- Def. $S(i)=\{j\mid \exists\text{ stable matching } \pi':\pi'(i)=j\}$
- the set of possible partners for $a_i$
- G-S assigns each $a_i$ the best possible partner in $S(i)$
- the solution favours the $a_i$'s but not the $b_j$'s
- the $b_j$'s are only guaranteed increasingly preferred partners after they are first matched
- Lemma. In an execution of the algorithm, $\not\exists i,j$ such that $j\in S(i)$ and $b_j$ not available to $a_i$. That is, for all executions, either $b_j$ is available to $a_i$ or $j\notin S(i)$.
- Proof. Suppose not, and consider the first time this happens during the execution. Then there is some $j\in S(i)$ such that $b_j$ is not available to $a_i$. That is, there exists $a_{i'}$ such that $b_j$ accepted $a_{i'}$ and $b_j$ ranks $a_{i'}$ above $a_i$. Since $j\in S(i)$, there exists a stable matching $\pi'$ that matches $a_i$ and $b_j$; let $b_{j'}$ be $a_{i'}$'s partner in $\pi'$. If $a_{i'}$ prefers $b_j$ to $b_{j'}$, then $\pi'$ is not stable ($a_{i'}$ and $b_j$ prefer each other to their partners), which is a contradiction. On the other hand, if $a_{i'}$ prefers $b_{j'}$ to $b_j$, then before making an offer to $b_j$, $a_{i'}$ must have made an offer to $b_{j'}$ and been turned down or turned away. Since $j'\in S(i')$, this is an earlier occurrence where $j'\in S(i')$ and $b_{j'}$ is unavailable to $a_{i'}$, contradicting the choice of $i$ and $j$ as the first such occurrence.
- At the end of the process, each $a$ ends up with the best possible $b$ it could be matched with in any stable matching, and each $b$ ends up with the worst possible $a$.
def gale_shapley(
    a_pref: dict[str, list[str]],
    b_pref: dict[str, list[str]]
) -> dict[str, str]:
    unmatched_a = list(a_pref.keys())
    matches = {}  # maps each matched b_j to its current a_i
    rejects = {a: [] for a in a_pref}
    while unmatched_a:
        ai = unmatched_a.pop()  # choose i
        for bj in a_pref[ai]:  # consider a_i's preferences (list of b's)
            if bj in rejects[ai]:  # b_j has already rejected a_i
                continue
            elif bj not in matches:  # b_j is unmatched
                matches[bj] = ai  # match a_i and b_j
                break  # move to the next unmatched a_i
            elif b_pref[bj].index(ai) < b_pref[bj].index(matches[bj]):  # b_j prefers a_i to its current match
                unmatched_a.append(matches[bj])  # b_j unmatches with current match
                matches[bj] = ai  # match a_i and b_j
                break  # move to the next unmatched a_i
            else:
                rejects[ai].append(bj)  # b_j rejects a_i
    return {bj: matches[bj] for bj in sorted(matches)}
import random
def shuffle_prefs(prefs):
for x in prefs:
random.shuffle(prefs[x])
return prefs
a_pref = {
'A': ['X', 'Y', 'Z'],
'B': ['Y', 'X', 'Z'],
'C': ['Z', 'Y', 'X']
}
b_pref = {
'X': ['B', 'A', 'C'],
'Y': ['C', 'B', 'A'],
'Z': ['A', 'C', 'B']
}
print(gale_shapley(a_pref, b_pref))
print(gale_shapley(shuffle_prefs(a_pref), shuffle_prefs(b_pref)))
print(gale_shapley(shuffle_prefs(a_pref), shuffle_prefs(b_pref)))
print(gale_shapley(shuffle_prefs(a_pref), shuffle_prefs(b_pref)))
{'X': 'A', 'Y': 'B', 'Z': 'C'}
{'X': 'B', 'Y': 'C', 'Z': 'A'}
{'X': 'B', 'Y': 'A', 'Z': 'C'}
{'X': 'C', 'Y': 'B', 'Z': 'A'}
Big-O Notation
Def. Given $f,g:\mathbb{N}\rightarrow\mathbb{R}^+$,
- $f(n)$ is $O(g(n))$ if there exists $n_0, C>0$ such that for all $n\geq n_0$, $f(n)\leq Cg(n)$ (upper bound for $f$).
- $f(n)$ is $\Omega(g(n))$ if there exists $n_0, C>0$ such that for all $n\geq n_0$, $f(n)\geq Cg(n)$ (lower bound for $f$; equivalently, $g(n)$ is $O(f(n))$).
- $f(n)$ is $\Theta(g(n))$ if $f(n)$ is both $O(g(n))$ and $\Omega(g(n))$. Equivalently, we say that $f(n)$ is $\Theta(g(n))$ if there exists $n_0$, $c,C>0$ such that for all $n\geq n_0$, $cg(n)\leq f(n)\leq Cg(n)$ ($f$ and $g$ are approximately equivalent).
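For example, $f(n)=3n^2+5n$ is $O(n^2)$: taking $n_0=1$ and $C=8$, for all $n\geq 1$ we have $3n^2+5n\leq 3n^2+5n^2=8n^2$. Since $3n^2+5n\geq 3n^2$ for all $n$, it is also $\Omega(n^2)$ (take $c=3$), and hence $\Theta(n^2)$.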
Other information.
- Transitivity: If $f(n)$ is $O(g(n))$ and $g(n)$ is $O(h(n))$, then $f(n)$ is $O(h(n))$.
- Sum: If $f_1(n)$ is $O(g_1(n))$ and $f_2(n)$ is $O(g_2(n))$, then $f_1(n)+f_2(n)$ is $O(\max\{g_1(n),g_2(n)\})$.
- Product: If $f_1(n)$ is $O(g_1(n))$ and $f_2(n)$ is $O(g_2(n))$, then $f_1(n)f_2(n)$ is $O(g_1(n)g_2(n))$.
Interval Scheduling
Maximising the number of jobs accepted
There are $n$ jobs. Each job $i$ has a set time interval $[a_i, b_i]$ when it must run its job if it is accepted. We want to find a schedule $S$ which accepts the maximum number of jobs without having two jobs which run simultaneously.
Def. A sequence $S=(i_1,\cdots,i_m)$ is a valid schedule if for all $j\in[1,m-1]$, $b_{i_j}\leq a_{i_{j+1}}$, that is, job $i_{j+1}$ does not start before $i_j$ finishes. Let $|S|$ be the number of jobs accepted.
- Goal: Find a valid schedule which maximises $|S|=m$.
- Possible solution (greedy algorithm): At each step, choose the job (out of the remaining available jobs) which finishes first.
- The optimal schedule from the greedy algorithm is not necessarily unique.
Pseudocode.
sort jobs in order of $b_j$ so that $b_1\leq\cdots\leq b_n$
initialise $S=\emptyset$, $k=0$, and $b_{i_0}=0$
for $j=1,\cdots,n$ do
if $a_j\geq b_{i_k}$ then
$i_{k+1}=j$
add $i_{k+1}$ to $S$
$k=k+1$
take schedule $S$
Proof. The greedy algorithm stays ahead: it finishes its $j$-th job at the same time as or before any other schedule finishes its $j$-th job.
- The greedy algorithm gives the longest valid schedule.
- Def. Given a valid schedule $S=(i_1,\cdots,i_m)$, we define $t_j(S)=b_{i_j}$ to be the time $S$ finishes job $i_j$ (its $j$-th job). If $j>m$ (job is not accepted), set $t_j(S)=\infty$.
- Lemma. Let $S$ be the schedule given by the greedy algorithm. For any other schedule $S'=(i_1',\cdots, i_{m'}')$, $t_j(S)\leq t_j(S')$ for all $j$.
- Proof. By induction on $j$.
Base case. $j=1$. Then $t_1(S)=b_{i_1}\leq b_{i'_1}=t_1(S')$.
Inductive case. Assume $t_j(S)\leq t_j(S')$. If $t_{j+1}(S')=\infty$, the proof is complete. Otherwise, $t_j(S)\leq t_j(S')\leq a_{i_{j+1}'}$ by the inductive hypothesis and the definition of a valid schedule. Since $t_j(S)\leq a_{i_{j+1}'}$, job $i_{j+1}'$ is also available to $S$. Since $S$ chooses the job that finishes first, we have that $t_{j+1}(S)=b_{i_{j+1}}\leq b_{i_{j+1}'}=t_{j+1}(S')$, which completes the proof.
- This algorithm can be implemented in $O(n\log n)$ by first sorting the jobs in increasing order of $b_i$ and then going through the jobs and accepting any job which does not start before the previously accepted job ends.
def interval_scheduling_max_jobs(
jobs: dict[int, tuple[int, int]]
) -> list[int]:
res = []
prev_end_time = -1
# sort jobs by end time
jobs_sorted = sorted(jobs.items(), key=lambda x: x[1][1])
for job, (start, end) in jobs_sorted:
if start >= prev_end_time:
res.append(job)
prev_end_time = end
return res
j1 = {1: (0, 6), 2: (1, 4), 3: (3, 5), 4: (5, 7), 5: (5, 9)}
sched1 = interval_scheduling_max_jobs(j1)
print(f"scheduled jobs: {sched1}")
j2 = {6: (2, 5), 7: (4, 8), 8: (6, 10), 9: (0, 3), 10: (7, 11), 11: (30, 40), 12: (12, 13), 13: (100, 200)}
sched2 = interval_scheduling_max_jobs(j2)
print(f"scheduled jobs: {sched2}")
j3 = {14: (5, 9), 15: (8, 12), 16: (1, 2), 17: (2, 4), 18: (3, 6)}
sched3 = interval_scheduling_max_jobs(j3)
print(f"scheduled jobs: {sched3}")
scheduled jobs: [2, 4]
scheduled jobs: [9, 7, 12, 11, 13]
scheduled jobs: [16, 17, 14]
Minimising maximum lateness
There are $n$ jobs, each job $i$ with length $l_i>0$ and deadline $d_i$. The jobs can be scheduled at any time $t\geq 0$ but we want to complete the jobs so that no two jobs run simultaneously and the maximum lateness of any single job is minimised.
Def. Given a schedule $S=(i_1,\cdots, i_n)$, which is a permutation of $[n]$, define $t_S(i_k)=\sum_{j=1}^k l_{i_j}$ to be the time at which job $i_k$ is completed.
- Goal: Find a schedule $S$ that minimises $\max_{j\in[n]}\{t_S(i_j)-d_{i_j}\}$.
- Possible solution (greedy algorithm): Perform the jobs in order of their deadlines.
Proof. We can transform any optimal schedule $S'$ into the greedy schedule $S$ by exchanging pairs of jobs without increasing the maximum lateness (exchange argument).
- The schedule produced by the greedy algorithm is optimal.
- Lemma. If $S=(i_1,\cdots, i_n)$ is an optimal schedule, for any $j\in[n-1]$, if $d_{i_j}>d_{i_{j+1}}$ (swapped compared to the schedule generated by the greedy algorithm), then the schedule $S'$ obtained by swapping $i_j$ and $i_{j+1}$ is also optimal.
- Proof. Notice that swapping $i_j$ and $i_{j+1}$ does not affect the completion times of the other jobs, that is, $t_{S'}(i_{j'})=t_S(i_{j'})$ for all $j'\neq j, j+1$. Also, since $S'$ schedules $i_{j+1}$ directly before $i_j$, we have that $t_{S'}(i_j)=t_S(i_{j+1})=t_{S'}(i_{j+1})+l_{i_j}$. For job $i_j$: since $d_{i_j}>d_{i_{j+1}}$, $t_{S'}(i_j)-d_{i_j}=t_S(i_{j+1})-d_{i_j}<t_S(i_{j+1})-d_{i_{j+1}}$. For job $i_{j+1}$: since $t_{S'}(i_{j+1})<t_S(i_{j+1})$, $t_{S'}(i_{j+1})-d_{i_{j+1}}<t_S(i_{j+1})-d_{i_{j+1}}$. Thus, the lateness of each of $i_j$ and $i_{j+1}$ in $S'$ is less than the lateness of $i_{j+1}$ in $S$. As such, the maximum lateness of $S'$ is less than or equal to the maximum lateness of $S$.
- We can use the lemma to swap two adjacent jobs whenever they are out of order. This is repeated until everything is in order (which produces the schedule generated by the greedy algorithm).
def interval_scheduling_min_max_lateness(
    jobs: dict[int, tuple[int, int]]
) -> tuple[list[int], int]:
res = []
current_time = 0
max_lateness = 0
# sort jobs by deadline
jobs_sorted = sorted(jobs.items(), key=lambda x: x[1][1])
for jobno, (duration, deadline) in jobs_sorted:
current_time += duration
max_lateness = max(max_lateness, max(0, current_time - deadline))
res.append(jobno)
return res, max_lateness
j1 = {1: (2, 4), 2: (1, 3), 3: (2, 5), 4: (3, 7)}
sched1, max_lateness1 = interval_scheduling_min_max_lateness(j1)
print(f'schedule: {sched1}, max lateness: {max_lateness1}')
j2 = {1: (3, 6), 2: (2, 4), 3: (1, 3)}
sched2, max_lateness2 = interval_scheduling_min_max_lateness(j2)
print(f'schedule: {sched2}, max lateness: {max_lateness2}')
j3 = {1: (4, 5), 2: (2, 2), 3: (1, 4), 4: (3, 7)}
sched3, max_lateness3 = interval_scheduling_min_max_lateness(j3)
print(f'schedule: {sched3}, max lateness: {max_lateness3}')
j4 = {1: (1, 2), 2: (2, 5), 3: (3, 8), 4: (1, 3)}
sched4, max_lateness4 = interval_scheduling_min_max_lateness(j4)
print(f'schedule: {sched4}, max lateness: {max_lateness4}')
j5 = {1: (2, 3), 2: (1, 4), 3: (3, 6)}
sched5, max_lateness5 = interval_scheduling_min_max_lateness(j5)
print(f'schedule: {sched5}, max lateness: {max_lateness5}')
schedule: [2, 1, 3, 4], max lateness: 1
schedule: [3, 2, 1], max lateness: 0
schedule: [2, 3, 1, 4], max lateness: 3
schedule: [1, 4, 2, 3], max lateness: 0
schedule: [1, 2, 3], max lateness: 0
Dijkstra's Algorithm (Shortest Path)
Directed graph $G$ with non-negative edge lengths $\{l_{uv}\mid (u,v)\in E\}$, with starting vertex $s\in V$ and a destination vertex $t\in V$.
- Goal: Find the shortest path from $s$ to $t$.
Review of DFS and BFS.
- Direct connectivity: Given a directed graph $G$ and vertices $s$ and $t$, is there a path from $s$ to $t$?
- Pseudocode
initialise $S_{reached}=\{s\}$
$E_{unexplored}\leftarrow\{(s,v)\mid (s,v)\in E\}$
while $E_{unexplored}\neq\emptyset$ do
remove an edge $(u,v)\in E_{unexplored}$
if $v\in S_{reached}$ then
continue
else if $v\neq t$ and $v\notin S_{reached}$ then
add $v$ to $S_{reached}$
add all of the edges $\{(v,w)\mid (v,w)\in E\}$ to $E_{unexplored}$
else $v=t$
return True
return False
- adding and removing edges from $E_{unexplored}$:
- storing $E_{unexplored}$ using a stack $\implies$ DFS
- storing $E_{unexplored}$ using a queue $\implies$ BFS
- runtime is $O(|E|)$ because we explore all edges, with each edge being added and removed from $E_{unexplored}$ at most once
Pseudocode.
initialise $S=\{s\}$
initialise $d_s=0$
$E_{candidate}\leftarrow \{(s,v)\mid (s,v)\in E\}$
initialise $d_e=l_e$ for every edge $e=(s,v)\in E_{candidate}$
while $E_{candidate}\neq\emptyset$ do
remove $e=(v,w)$ from $E_{candidate}$, which has minimum $d_e$
if $w\in S$ then
continue, we have already found a path with length $\leq$ $d_e$
else if $w\neq t$ and $w\notin S$ then
add $w$ to $S$
$d_w=d_e=d_v+l_{vw}$
add all of the edges $\{(w,x)\mid (w,x)\in E\}$ to $E_{candidate}$
set $d_{e'}=d_w+l_{e'}$ for each newly added edge $e'=(w,x)$
else $w=t$
add $t$ to $S$
$d_t=d_e=d_v+l_{vt}$
return $d_t$
return None
Proofs.
- Lemma. For all $v\in S$, $d_v$ is the minimum length of a path from $s$ to $v$.
- Proof. By induction on $|S|$.
Base case: $|S|=1$. Thus, $S=\{s\}$, and $d_s=0$ is indeed the minimum length of a path from $s$ to $s$. The base case holds.
Inductive case: Let $|S|=k$. Suppose that for all $v\in S$, $d_v$ is the minimum length of a path from $s$ to $v$. Consider what happens when we add the next vertex $w$ to $S$ via the edge $(v,w)$, where $v\in S$. We'll show that $d_w=d_v+l_{vw}$ is the minimum length of a path from $s$ to $w$. Suppose on the contrary that there is another path $P'$ from $s$ to $w$ which has smaller length. Let $w'$ be the first vertex on this path which is not in $S$ and let $(v',w')$ be the edge used to reach $w'$. By the inductive hypothesis, the portion of $P'$ from $s$ to $v'$ has length at least $d_{v'}$. Also, $d_{v'}+l_{v'w'}\geq d_v+l_{vw}=d_w$, because otherwise Dijkstra's algorithm would have taken the edge $(v',w')$ and added $w'$ instead of taking $(v,w)$ and adding $w$ when considering the next edge. Since edge lengths are non-negative, the length of $P'$ is at least $d_{v'}+l_{v'w'}\geq d_w$, which contradicts the assumption that the length of $P'$ is less than $d_w$. As such, we have that $d_w$ is the minimum length of a path from $s$ to $w$.
Other information.
- In order for Dijkstra's algorithm to work, the edge weights must be non-negative for the comparison to hold.
- Dijkstra's algorithm can be implemented in $O(|E|\log|E|)$ time.
- We can use a priority queue to store the candidate edges $(v,w)$ and distances $d_e$.
- Each edge is added at most once and removed at most once, so we perform at most $2|E|$ operations on this priority queue.
- The priority queue never has more than $|E|$ elements, so each operation takes $O(\log|E|)$ time.
import heapq
def dijkstra(graph: dict[str, list[tuple[str, int]]], start: str) -> tuple[dict[str, float], dict[str, str | None]]:
    distances = {node: float('inf') for node in graph}
    distances[start] = 0
    predecessors = {node: None for node in graph}
    priority_queue = [(0, start)]
    while priority_queue:
        current_distance, current_node = heapq.heappop(priority_queue)
        if current_distance > distances[current_node]:
            continue  # stale queue entry: a shorter path to this node was already found
        for neighbor, weight in graph[current_node]:
            distance = current_distance + weight
            if distance < distances[neighbor]:
                distances[neighbor] = distance
                predecessors[neighbor] = current_node
                heapq.heappush(priority_queue, (distance, neighbor))
    return distances, predecessors
def shortest_path(graph: dict[str, list[tuple[str, int]]], start: str, end: str) -> tuple[list[str] | str, float]:
distances, predecessors = dijkstra(graph, start)
path = []
current_node = end
while current_node is not None:
path.insert(0, current_node)
current_node = predecessors[current_node]
return (path, distances[end]) if path[0] == start else ("NO PATH", float('inf'))
graph = {
'A': [('B', 3), ('C', 1), ('E', 2)],
'B': [('D', 2), ('E', 4)],
'C': [('B', 2), ('F', 5)],
'D': [('E', 1), ('G', 8)],
'E': [('H', 5)],
'F': [('E', 1), ('H', 6)],
'G': [('H', 4)],
'H': []
}
p1, d1 = shortest_path(graph, 'A', 'D')
print(f"Shortest path from 'A' to 'D': {p1}, distance: {d1}")
p2, d2 = shortest_path(graph, 'A', 'E')
print(f"Shortest path from 'A' to 'E': {p2}, distance: {d2}")
p3, d3 = shortest_path(graph, 'A', 'G')
print(f"Shortest path from 'A' to 'G': {p3}, distance: {d3}")
Shortest path from 'A' to 'D': ['A', 'B', 'D'], distance: 5
Shortest path from 'A' to 'E': ['A', 'E'], distance: 2
Shortest path from 'A' to 'G': ['A', 'B', 'D', 'G'], distance: 13
Data Structures
Data structures are used for efficiently storing and accessing data needed for algorithms.
- arrays, linked lists, heaps, binary search trees, and hash tables specify how the data should be stored
- abstract data types, such as stacks, queues, and priority queues, specify operations that can be performed
Array: An array of length $n$ has $n$ elements, $A[0],A[1],\cdots,A[n-1]$.
- $A[i]$ gives the element of $A$ at index $i$
- allow us to quickly store and access data but we have to remember where we put everything
- need to sort an array to put data in order (takes $O(n\log n)$ time using mergesort or another efficient sorting algorithm)
- advantages: can use binary search to quickly find elements; can traverse the array in order
- disadvantages: sorted arrays are static, can't add or remove elements
Linked list: A linked list is a set of nodes where each node contains an element and points to the next node (null at the end). Starting from head, we can iterate through the rest of the linked list.
- may be useful to keep the tail pointer as well.
- linked lists can also be doubly-linked, each node contains pointer to previous node
- advantages: easy to insert elements; easy to remove elements for a doubly-linked list
- disadvantages: hard to access elements at a specific index
Stack: Has $O(1)$ operations, can be implemented using either arrays or linked lists.
push(x): adds $x$ to the top of the stack
pop(): removes and returns the top of the stack
peek(): returns but does not remove the top of the stack
Queue: Has $O(1)$ operations, can be implemented using either arrays or linked lists that keep track of the tail.
enqueue(x): adds $x$ to the back of the queue
dequeue(): removes and returns the first element of the queue
peek(): returns but does not remove the first element of the queue
Priority queue: Similar to queue, but each element has a priority value and instead of taking the element at the front of the queue, we take the element with the smallest priority value.
insert(x,v): adds $x$ to the priority queue with priority $v$
delete min(): removes and returns the element with the smallest priority value
peek(): returns but does not remove the element with the smallest priority value
Binary min-heap: Structure where each node has 0, 1, or 2 children and each node has a value which is less than or equal to its children. Key idea: Smallest element of the heap must be at the top of the heap and may be useful to require heap to be an almost-complete binary tree.
insert(x): add $x$ to the next spot and, while it is smaller than its parent, swap it with its parent. $O(\log n)$
delete(): remove and return the top of the heap; take the element in the last-occupied position, put it at the top, and while it is larger than at least one child, swap it with its smaller child. $O(\log n)$
- can be implemented with an array
- each $A[i]$ is a node, top is $A[1]$, and left and right children of $A[i]$ are $A[2i]$ and $A[2i+1]$
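A minimal Python sketch of these two operations, using the 1-indexed array layout described above (a dummy entry occupies index $0$); in practice Python's built-in heapq module provides the same functionality on a plain list:
class MinHeap:
    def __init__(self):
        self.a = [None]  # dummy entry so the top is a[1] and children of a[i] are a[2i], a[2i+1]

    def insert(self, x):
        # add x at the next spot, then swap upwards while smaller than its parent: O(log n)
        self.a.append(x)
        i = len(self.a) - 1
        while i > 1 and self.a[i] < self.a[i // 2]:
            self.a[i], self.a[i // 2] = self.a[i // 2], self.a[i]
            i //= 2

    def delete(self):
        # remove the top; move the last element up, then swap downwards with the
        # smaller child while larger than at least one child: O(log n)
        top = self.a[1]
        last = self.a.pop()
        if len(self.a) > 1:
            self.a[1] = last
            i = 1
            while True:
                smallest = i
                for c in (2 * i, 2 * i + 1):
                    if c < len(self.a) and self.a[c] < self.a[smallest]:
                        smallest = c
                if smallest == i:
                    break
                self.a[i], self.a[smallest] = self.a[smallest], self.a[i]
                i = smallest
        return top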
Minimum Spanning Trees
Def. Given a graph $G=(V,E)$ where each edge $e$ has length $\ell_e$, a minimum spanning tree $T$ is a set of edges $T\subseteq E$ such that $(V,T)$ is a tree and $\sum_{e\in T}\ell_e$ is minimised.
Kruskal's Algorithm
Algorithm.
- Sort the edges of $E$ in order of length.
- Go through the edges one by one and take each edge which does not form a cycle with the edges taken so far.
Pseudocode.
sort $E$ by edge length
initialise $T=\emptyset$, where $T$ is the set of edges we've taken so far
repeat:
take next edge $e\in E$
if $T\cup\{e\}$ contains a cycle then
discard $e$
else
add $e$ to $T$
until $|T|=|V|-1$ or there are no edges left to consider
Proof. To see that Kruskal's algorithm gives the minimum spanning tree $T$, observe that:
- If Kruskal's algorithm adds an edge $e=\{u,v\}$, let $L$ be the set of vertices $u'$ such that there is a path from $u$ to $u'$ using the edges which we have added to $T$ so far. Let $R=V\setminus L$. Note that $v\notin L$; otherwise adding $e$ would create a cycle. By definition of $L$, no edges between $L$ and $R$ were added to $T$. Thus, $e$ must be the shortest edge between $L$ and $R$; if there were some $e'$ between $L$ and $R$ that were shorter, it would be added by the algorithm sooner. Therefore, $e\in T$.
- If there exists a cut $C=(L,R)$ such that $e$ is the shortest edge between $L$ and $R$, then $e$ is the first edge between $L$ and $R$ that Kruskal's algorithm will consider. At this point, no other edges between $L$ and $R$ have been added so adding $e$ will not create a cycle. Therefore $e\in T$.
Additional information.
- Checking whether adding an edge to $T$ creates a cycle can be done in amortised $O(\alpha(n))$ time per edge.
- $\alpha(n)$ is the inverse Ackermann function.
- This uses the union-find data structure.
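A Python sketch of Kruskal's algorithm using union-find with path compression (union by rank is omitted for brevity, so this sketch does not attain the full amortised $O(\alpha(n))$ bound); the representation of vertices as $0,\dots,n-1$ and edges as (length, u, v) triples is an assumption:
def kruskal(n: int, edges: list[tuple[int, int, int]]) -> list[tuple[int, int, int]]:
    parent = list(range(n))  # union-find: parent pointer for each vertex

    def find(u):  # find the representative of u's component, compressing the path
        while parent[u] != u:
            parent[u] = parent[parent[u]]
            u = parent[u]
        return u

    T = []
    for length, u, v in sorted(edges):  # consider edges in order of length
        ru, rv = find(u), find(v)
        if ru != rv:           # u and v are in different components: no cycle
            parent[ru] = rv    # merge the two components
            T.append((length, u, v))
        if len(T) == n - 1:    # a spanning tree has |V|-1 edges
            break
    return T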
Prim's Algorithm
- Key idea: At each step, we take the shortest edge to a new destination.
- Similar to Dijkstra's algorithm and takes $O(|E|\log|E|)$ time.
- Instead of storing the total length of the path from $s$ to $v$ using an edge $e=(u,v)$, we store $\ell_e$ and put it in the priority queue.
- Prim's algorithm does not require the initial sorting that Kruskal's algorithm requires.
Proof. To see that Prim's algorithm gives the minimum spanning tree $T$, observe that:
- Whenever the algorithm adds an edge $e$, $e$ is the shortest edge between the set $S$ of vertices which have been reached so far and $V\setminus S$, so $e\in T$.
- If $e$ is an edge of $T$, then when the algorithm considers $e$, it will add it: since Prim's algorithm only adds edges of $T$, adding $e$ cannot create a cycle, so $e$ must reach a new vertex.
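A Python sketch of Prim's algorithm in the style of the Dijkstra implementation above, keying the priority queue on $\ell_e$ alone; the adjacency-list representation (each vertex maps to (neighbour, length) pairs, undirected so each edge appears in both lists) is an assumption:
import heapq

def prim(graph: dict[str, list[tuple[str, int]]]) -> list[tuple[str, str, int]]:
    start = next(iter(graph))
    S = {start}                    # vertices reached so far
    T = []                         # MST edges taken so far
    candidates = [(l, start, v) for v, l in graph[start]]
    heapq.heapify(candidates)      # priority queue of candidate edges, keyed on length
    while candidates and len(S) < len(graph):
        l, u, v = heapq.heappop(candidates)  # shortest candidate edge
        if v in S:
            continue               # both endpoints already reached: would form a cycle
        S.add(v)
        T.append((u, v, l))
        for w, lw in graph[v]:     # add edges from the newly reached vertex
            if w not in S:
                heapq.heappush(candidates, (lw, v, w))
    return T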
Correctness of MST Algorithms
- Note that if $e$ is the shortest edge incident to a vertex $v$, then $e\in T$.
- Def. A cut is a partition $(L,R)$ of the vertices of $G$ where $L,R\neq\emptyset$. An edge $e=(u,v)$ crosses the cut $(L,R)$ if $u\in L$ and $v\in R$, or vice versa.
- Thm. For each edge $e\in E$, $e\in T$ if and only if there exists a cut $(L, R)$ such that $e$ is the shortest edge crossing $(L,R)$.
- Proof. ($\rightarrow$) Let $e=(u,v)\in T$. Take $L$ to be the set of vertices reachable from $u$ using the edges $T\setminus\{e\}$, and take $R=V\setminus L$. If there were a shorter edge $e'$ crossing $(L,R)$, then $T'=(T\cup\{e'\})\setminus\{e\}$ would be a spanning tree with shorter total length, which would contradict our assumption that $T$ is a MST.
($\leftarrow$) Let $e$ be the shortest edge crossing $(L,R)$. Suppose on the contrary that $e\notin T$. Then adding $e$ to $T$ creates a cycle. This cycle contains some other edge $e'$ crossing $(L,R)$. If we add $e$ to $T$ and remove $e'$ from $T$, $T$ will have shorter length and is still a spanning tree, which contradicts our assumption that $T$ is a MST. Therefore, $e\in T$.
- Thm. For all edges $e\in E$, $e\notin T$ if and only if there exists a cycle $C$ such that $e$ is the longest edge of $C$.
Solving Recurrence Relations
- Expand out recurrence relation by iteratively substituting the recurrence relation into itself
- Make educated guesses for the solution to recurrence relations by solving the homogeneous and inhomogeneous parts of the relation
Master Theorem
The Master Theorem allows us to obtain the runtime of a recursive algorithm from the recurrence relation describing its runtime. Let $T(n)$ be the worst-case runtime for an algorithm. If $T(n)=aT(\frac{n}{b})+O(n^c)$, let $c_{crit}=\log_b a$. Then:
- If $c<c_{crit}$, then $T(n)$ is $O(n^{c_{crit}})$.
- If $c>c_{crit}$, then $T(n)$ is $O(n^c)$.
- If $c=c_{crit}$, then $T(n)$ is $O(n^{c_{crit}}\log n)$.
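For example, the mergesort recurrence $T(n)=2T(\frac{n}{2})+O(n)$ below has $a=b=2$ and $c=1$, so $c_{crit}=\log_2 2=1=c$ and $T(n)$ is $O(n\log n)$; the Karatsuba recurrence $T(n)=3T(\frac{n}{2})+O(n)$ has $c_{crit}=\log_2 3\approx 1.58>1=c$, so $T(n)$ is $O(n^{\log_2 3})$.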
Recursive Algorithms
Binary Search
The binary search algorithm checks if an element $x$ is in a sorted array $A$ as follows:
- Input: The algorithm requires indices $i$ and $j$ such that if $x\in A$, it must be located at some index $i'\in[i,j]$.
- Initialisation: We call binary search on $A$ with $i=0$ and $j=n-1$.
- Recursive step: If $j<i$, then $x\notin A$. Otherwise take $k=\lfloor\frac{i+j}{2}\rfloor$. There are three cases:
- $x=A[k]$. Then we have found $x$.
- $x>A[k]$. Then we use binary search with $i'=k+1$ and $j'=j$.
- $x<A[k]$. Then we use binary search with $i'=i$ and $j'=k-1$.
- Recurrence relation: $T(n)=T(\frac{n}{2})+1$, so $T(n)$ is $O(\log n)$.
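A Python sketch of binary search, written iteratively rather than recursively (the two are equivalent here); it returns the index of $x$ in $A$, or None if $x\notin A$:
def binary_search(A: list[int], x: int) -> int | None:
    i, j = 0, len(A) - 1
    while i <= j:  # if j < i, then x is not in A
        k = (i + j) // 2
        if x == A[k]:
            return k      # we have found x
        elif x > A[k]:
            i = k + 1     # x can only lie in A[k+1..j]
        else:
            j = k - 1     # x can only lie in A[i..k-1]
    return None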
Finding Local Maximum
This algorithm finds an index $i$ that is a local maximum in an array $A$, that is, an index whose value is at least as large as those of its neighbours:
- Initialisation: We call the algorithm on $A$ with $l=0$ and $r=n-1$.
- Recursive step: If $l=r$, then $l$ is a local maximum. Otherwise take $m=\lfloor\frac{l+r}{2}\rfloor$. There are two cases:
- $A[m]\geq A[m+1]$. Then we call algorithm with $l'=l$ and $r'=m$.
- $A[m]<A[m+1]$. Then we call algorithm with $l'=m+1$ and $r'=r$.
- Key idea (for local minimum): We compare the middle element with its neighbours. If the middle element is not greater than either of its neighbours, then it is a local minimum. If the middle element is greater than its left neighbour, then there is always a local minimum in the left half. If the middle element is greater than its right neighbour, then there is always a local minimum in the right half.
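A Python sketch of the recursive step above for the local maximum, written iteratively; it returns an index $m$ such that $A[m]$ is at least as large as its neighbours:
def local_maximum(A: list[int]) -> int:
    l, r = 0, len(A) - 1
    while l < r:
        m = (l + r) // 2
        if A[m] >= A[m + 1]:
            r = m        # a local maximum exists in A[l..m]
        else:
            l = m + 1    # a local maximum exists in A[m+1..r]
    return l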
Mergesort
This algorithm sorts an array $A$:
- Split the array into two subarrays by dividing $A$ in half.
- Call mergesort on elements $0$ through $\lfloor\frac{n}{2}\rfloor-1$ of the array.
- Call mergesort on elements $\lfloor\frac{n}{2}\rfloor$ through $n-1$ of the array.
- If $A$ and $B$ are two sorted arrays of lengths $n_1$ and $n_2$, we can merge these arrays into a sorted array $C$ of length $n_1+n_2$:
- Initialisation: Start with $i=0$ and $j=0$.
- Iterative step: If $j\geq n_2$, or $i<n_1$ and $A[i]<B[j]$, then set $C[i+j]=A[i]$ and increment $i$. If $i\geq n_1$, or $j<n_2$ and $B[j]\leq A[i]$, then set $C[i+j]=B[j]$ and increment $j$.
- Recurrence relation: $T(n)=2T(\frac{n}{2})+n$, so $T(n)$ is $O(n\log n)$.
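A Python sketch of mergesort following the steps above (this version returns a new sorted list rather than sorting in place):
def mergesort(A: list[int]) -> list[int]:
    n = len(A)
    if n <= 1:
        return A
    L = mergesort(A[:n // 2])   # sort elements 0 through floor(n/2)-1
    R = mergesort(A[n // 2:])   # sort elements floor(n/2) through n-1
    C, i, j = [], 0, 0
    while i < len(L) or j < len(R):   # merge the two sorted halves
        if j >= len(R) or (i < len(L) and L[i] <= R[j]):
            C.append(L[i])
            i += 1
        else:
            C.append(R[j])
            j += 1
    return C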
Counting Inversions
Problem: Given a sequence $a_1,\cdots, a_n$ of distinct numbers, how many pairs $i,j\in[n]$ are there such that $i<j$ but $a_i>a_j$?
Naive solution: Consider every pair $i,j$. This takes $O(n^2)$ time.
Algorithm: Given an array $A$ of $n$ distinct elements, we can simultaneously count the number of inversions in $A$ and sort $A$ as follows:
- Base case: If $n=1$, the array is already sorted and there are no inversions.
- Divide and conquer: Recursively apply this algorithm to elements $0$ through $\lfloor\frac{n}{2}\rfloor-1$ of $A$, and let $count_L$ be the number of inversions that were in these elements of $A$. Similarly, let $count_R$ be the number of inversions that are in elements $\lfloor\frac{n}{2}\rfloor$ through $n-1$ of $A$.
- Merge: If $A$ and $B$ are two sorted arrays of lengths $n_1$ and $n_2$, then we can count the number of pairs $i,j$ such that $a_i>b_j$ and merge these sequences into a sorted array $C$ of length $n_1+n_2$:
- Initialisation: Start with $i=0$, $j=0$, and $count_{between}=0$.
- Iterative step: If $j\geq n_2$, or $i<n_1$ and $a_i\leq b_j$, then set $c_{i+j}=a_i$ and increase $i$ by $1$. If $i\geq n_1$, or $j<n_2$ and $b_j<a_i$, then set $c_{i+j}=b_j$, increase $count_{between}$ by $n_1-i$ and increase $j$ by $1$.
- Solution: After the merging step of the two sorted halves, the total number of inversions in $A$ is $count_L+count_R+count_{between}$.
Proof of correctness: At each step, we have the elements in $C$, followed by the remaining elements of $A$ and then the remaining elements of $B$. When an element of $A$ is added to $C$, nothing changes. When an element $b_j$ of $B$ is added to $C$, $b_j<a_{i'}$ for all $a_{i'}$ remaining in $A$, so each of these remaining $a_{i'}$ was previously inverted with $b_j$. Shifting $b_j$ before all of these $a_{i'}$ removes all of these inversions, reducing the number of inversions by $n_1-i$, the number of elements remaining in $A$. Thus, $count_{between}$ keeps track of the number of inversions between $A$ and $B$ which we have removed so far. When we are finished, there will be no inversions, so $count_{between}$ will be the number of inversions between $A$ and $B$ at the start.
Runtime: This algorithm can count many inversions at once, which allows the algorithm to run in $O(n\log n)$ time as opposed to $O(n^2)$ time.
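A Python sketch of the algorithm, returning the inversion count together with a sorted copy of the array:
def count_inversions(A: list[int]) -> tuple[int, list[int]]:
    n = len(A)
    if n <= 1:
        return 0, A   # base case: no inversions
    count_l, L = count_inversions(A[:n // 2])
    count_r, R = count_inversions(A[n // 2:])
    C, i, j, count_between = [], 0, 0, 0
    while i < len(L) or j < len(R):   # merge while counting cross inversions
        if j >= len(R) or (i < len(L) and L[i] <= R[j]):
            C.append(L[i])
            i += 1
        else:
            C.append(R[j])
            count_between += len(L) - i   # R[j] is inverted with every element left in L
            j += 1
    return count_l + count_r + count_between, C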
Closest Pair of Points
Problem: Given a set $P=\{p_1,\cdots,p_n\}\subseteq\mathbb{R}^2$ of $n$ points in the plane, which two points are closest to each other?
Naive solution: Consider every pair of points $p_i,p_j$. This takes $O(n^2)$ time.
Algorithm: Given arrays $X$ and $Y$ of the points sorted by their $x$-coordinate and $y$-coordinate respectively, the algorithm does the following:
- Base cases: If $n\leq 1$, then the algorithm returns infinity as there is no pair of points. If $n=2$, then the algorithm returns $p_1,p_2$ because it is the only pair of points.
- Divide: Let $m=\lfloor\frac{n}{2}\rfloor$. Then $X[m]$ is the middle entry of $X$. Take $P_L$ to be the set of all points to the left of $X[m]$, including $X[m]$. Take $P_R$ to be the set of all points to the right of $X[m]$, excluding $X[m]$. Then let $X_L$ and $Y_L$ contain all the points in $P_L$ sorted by $x$- and $y$-coordinate, respectively. We can do the same for $P_R$. This construction takes $O(n)$ time by going through $X$ and $Y$ and filtering by $P_L$ and $P_R$.
- Conquer: We recursively find the closest pair of points $p_{i_L}, p_{j_L}$ in the left half and $p_{i_R}, p_{j_R}$ in the right half.
- Merge: To find the closest pair of points overall, we also need to check whether there are any other pairs of points across the two halves which are closer than the pairs of points that we have already found:
- Take $d=\min\{d(p_{i_L}, p_{j_L}), d(p_{i_R}, p_{j_R})\}$. Let $P_{mid}=\{p_i=(x_i,y_i)\mid |x_i-X[m]|<d\}$ be the subset of points which are within $d$ of the dividing line $x=X[m]$. Let $Y_{mid}$ be an array of the points in $P_{mid}$ sorted by their $y$-coordinate.
- Consider all pairs $i,j$ such that one of the following is true:
- $i=i_L$ and $j=j_L$, or $i=i_R$ and $j=j_R$.
- $p_i,p_j\in P_{mid}$ and $p_j$ comes between $1$ and $11$ positions after $p_i$ in $Y_{mid}$ (visually, this involves splitting the middle strip into $\frac{d}{2}\times\frac{d}{2}$ cells; only cells within the next 3 cells on the same row and the next 8 cells over the next 2 rows can be within $d$ of the current cell).
- Take $i_{min},j_{min}$ to be the pair which minimises $d(p_i,p_j)$ among all such pairs $p_i,p_j$, and take $d_{min}=d(p_{i_{min}},p_{j_{min}})$.
Proof of correctness: With the two observations below, we can see that the algorithm checks all pairs of points which could possibly be within distance $d$ of each other:
- If $p_i\in P_L$ and $p_j\in P_R$, then $d(p_i,p_j)\geq d$ unless $p_i,p_j\in P_{mid}$. Note that $x_j-x_i=(x_j-x_{mid})+(x_{mid}-x_i)$. If $p_i\notin P_{mid}$, then $x_j-x_i\geq x_{mid}-x_i\geq d$. If $p_j\notin P_{mid}$, then $x_j-x_i\geq x_j-x_{mid}\geq d$. Therefore, any pair of points at distance less than $d$ either lies entirely within one half or has both points in $P_{mid}$.
- For each point $p_i\in P_{mid}$, there are at most $11$ points $p_j\in P_{mid}$ such that $0\leq y_j-y_i\leq d$. We can see this by partitioning the region $M=\{(x,y)\mid |x-x_{mid}|<d\}$ into rows of $4$ boxes, where each box has side length $d/2$. Observe that each such box can have at most $1$ point in it because otherwise there would be a pair of points in either $P_L$ or $P_R$ which are less than distance $d$ apart. Then, for any $p_i\in P_{mid}$, we can only have that $p_j\in P_{mid}$ and $0\leq y_j-y_i\leq d$ if $p_j$ is in the same row of boxes as $p_i$ or is in one of the two rows of boxes above $p_i$. Thus, there are only $11$ boxes which $p_j$ could be in, so there can be at most $11$ such $p_j$.
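A Python sketch of the algorithm, assuming at least two points and all points distinct; for brevity it checks up to $11$ strip successors directly rather than reasoning about cells:
import math

def closest_pair(points: list[tuple[float, float]]) -> tuple[float, tuple, tuple]:
    def dist(p, q):
        return math.hypot(p[0] - q[0], p[1] - q[1])

    def rec(X, Y):  # X, Y: the same points sorted by x- and y-coordinate
        n = len(X)
        if n <= 3:  # base case: brute force over all pairs
            return min((dist(p, q), p, q)
                       for i, p in enumerate(X) for q in X[i + 1:])
        m = n // 2
        x_mid = X[m - 1][0]                   # the dividing line
        XL, XR = X[:m], X[m:]
        left = set(XL)
        YL = [p for p in Y if p in left]      # filter Y in O(n), keeping y-order
        YR = [p for p in Y if p not in left]
        best = min(rec(XL, YL), rec(XR, YR))  # closest pair in each half
        d = best[0]
        strip = [p for p in Y if abs(p[0] - x_mid) < d]  # P_mid, sorted by y
        for i, p in enumerate(strip):
            for q in strip[i + 1:i + 12]:     # at most 11 candidates per point
                if q[1] - p[1] >= d:
                    break
                best = min(best, (dist(p, q), p, q))
        return best

    return rec(sorted(points), sorted(points, key=lambda p: p[1]))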
Karatsuba Multiplication Algorithm
The grade school algorithm for multiplying two $n$-digit numbers takes $O(n^2)$ time. We can use the Karatsuba multiplication divide-and-conquer algorithm: Given two $n$-digit numbers $x$ and $y$, taking $k=\lceil\frac{n}{2}\rceil$, we can write $x=10^kx_1+x_2$ and $y=10^ky_1+y_2$, where $x_1,y_1$ are $(n-k)$-digit numbers and $x_2,y_2$ are $k$-digit numbers. We then have that: $$xy=10^{2k}x_1y_1+10^kx_1y_2+10^kx_2y_1+x_2y_2$$
This allows us to compute $xy$ by taking the sum of smaller products. But this still requires four products, which does not give us a faster algorithm. However, notice that $x_1y_2+x_2y_1=(x_1+x_2)(y_1+y_2)-x_1y_1-x_2y_2$. Therefore, we have that: $$xy=10^{2k}x_1y_1+10^k((x_1+x_2)(y_1+y_2)-x_1y_1-x_2y_2)+x_2y_2$$
Recurrence relation: $T(n)=3T(\frac{n}{2})+O(n)$, so $T(n)$ is $O(n^{\log_2 3})$.
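A Python sketch of Karatsuba multiplication on non-negative integers (here the split uses $k=\lfloor\frac{n}{2}\rfloor$ rather than $\lceil\frac{n}{2}\rceil$; either choice works):
def karatsuba(x: int, y: int) -> int:
    if x < 10 or y < 10:              # base case: single-digit multiply
        return x * y
    k = max(len(str(x)), len(str(y))) // 2
    x1, x2 = divmod(x, 10 ** k)       # x = 10^k * x1 + x2
    y1, y2 = divmod(y, 10 ** k)       # y = 10^k * y1 + y2
    a = karatsuba(x1, y1)
    b = karatsuba(x2, y2)
    c = karatsuba(x1 + x2, y1 + y2) - a - b   # = x1*y2 + x2*y1, one product instead of two
    return 10 ** (2 * k) * a + 10 ** k * c + b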
Dynamic Programming
In dynamic programming, we solve a problem by solving smaller subproblems. Using the solutions to these subproblems, we can obtain solutions for larger and larger subproblems until we solve the entire problem. To design a dynamic programming algorithm, we need to do the following:
- Determine the subproblems which we need to solve.
- Find a recurrence relation for how to obtain the answer to a subproblem from the answers to smaller subproblems.
To implement the dynamic programming algorithm:
- Store the answers to the subproblems which we’ve solved so far (memoisation).
- This allows us to avoid repeating our work if we need the answer to a given subproblem multiple times.
- Iteratively compute the answer to the next subproblem using the recurrence relation.
Weighted Interval Scheduling
Problem: Given $n$ intervals $[a_1,b_1],\dots,[a_n,b_n]$ with weights $w_1,\dots,w_n$, find a valid schedule $S=(i_1,\dots,i_m)$ which maximises $\sum_{j=1}^{|S|} w_{i_j}$.
Preprocessing: Sort the times $T=\{a_i:i\in[n]\}\cup\{b_i:i\in[n]\}$ and let $(t_1,\dots,t_{2n})$ be the sorted times. Here, we assume that all the start and end times are distinct so there are no duplicates.
Algorithm: To solve this problem, we consider the following subproblems: For all $t\in T$, what is the maximum total weight which can be completed by time $t$? Let $S_t=\{S=(i_1,\dots,i_m): S\text{ is a valid schedule,} b_{i_m}\leq t\}$, the set of all valid schedules which are completed by time $t$. Also, let $w(t)=\max_{S\in S_t}(\sum_{j=1}^{|S|} w_{i_j})$ be the maximum total weight which can be completed by time $t$. Then we have the following recurrence relation for all $k\in[2n-1]$:
- If $t_{k+1}=a_i$ for some $i\in[n]$, then $w({t_{k+1}})=w(t_k)$.
- If $t_{k+1}=b_j$ for some $j\in[n]$, then $w(t_{k+1})=\max\{w(t_k), w(a_j)+w_j\}$.
Proof of correctness: If $t_{k+1}=a_i$ for some $i\in[n]$, then any schedule which finishes by time $t_{k+1}$ also finishes by time $t_k$ so $w(t_{k+1})=w(t_k)$. If $t_{k+1}=b_j$, then we can show that $w(t_{k+1})\geq \max\{w(t_k),w(a_j)+w_j\}$ and $w(t_{k+1})\leq\max\{w(t_k),w(a_j)+w_j\}$.
(LHS $\geq$ RHS) Observe that by definition of $w(t_k)$, there is a schedule that finishes by time $t_k$ with total weight $w(t_k)$. This schedule also finishes by $t_{k+1}$, so $w({t_{k+1}})\geq w(t_k)$. Similarly, by definition of $w(a_j)$, there is a schedule which finishes by time $a_j$ with total weight $w(a_j)$. Adding job $j$ to this schedule gives a schedule which finishes by time $t_{k+1}=b_j$ and has total weight $w(a_j)+w_j$, so $w(t_{k+1})\geq w(a_j)+w_j$.
(LHS $\leq$ RHS) Observe that by definition of $w(t_{k+1})$, there is a schedule with weight $w(t_{k+1})$ that finishes by time $t_{k+1}$. If this schedule does not contain job $j$, then this schedule finishes by $t_k$ and has weight $w(t_k)$, so $w(t_{k+1})\leq w(t_k)$. If this schedule contains job $j$, then the schedule consists of a subschedule $S$ with weight $w(S)$ which finishes by time $a_j$, plus job $j$. It must be the case that $w(S)\leq w(a_j)$, so we have that $w(t_{k+1})=w(S)+w_j\leq w(a_j)+w_j$.
Alternative proof of correctness: We can partition the schedules $S$ which finish by time $t=b_j$ based on whether they contain job $j$ or not. Observe that:
- The schedules that finish by time $t_{k+1}=b_j$ and do not contain job $j$ also finish by time $t_k$. The maximum weight completed by such a schedule is $w(t_k)$.
- The schedules $S$ which finish by time $t_{k+1}=b_j$ and contain job $j$ are the schedules of the form $S'\cup \{j\}$, where $S'$ is a schedule which finishes by time $a_j$. The maximum weight completed by such a schedule is $w(a_j)+w_j$.
Runtime: The preprocessing step takes $O(n\log n)$ time to sort the starting and ending times of the jobs. In the algorithm itself, there are $2n$ subproblems and each subproblem takes $O(1)$ time, so the algorithm runs in $O(n)$. Therefore, the entire algorithm takes $O(n\log n)$.
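A Python sketch of the recurrence above; jobs are given as $(a_i, b_i, w_i)$ triples, and as in the preprocessing step we assume all start and end times are distinct:
def max_weight_schedule(jobs: list[tuple[int, int, int]]) -> int:
    times = sorted(t for a, b, w in jobs for t in (a, b))
    job_ending_at = {b: (a, w) for a, b, w in jobs}  # look up a job by its end time
    best = {}     # best[t] = w(t), the maximum total weight completable by time t
    w_prev = 0    # w(t_k) for the previously processed time
    for t in times:
        w_t = w_prev                   # if t = a_i for some i, then w(t_{k+1}) = w(t_k)
        if t in job_ending_at:         # if t = b_j, also consider taking job j
            a, w = job_ending_at[t]
            w_t = max(w_t, best[a] + w)
        best[t] = w_t
        w_prev = w_t
    return w_prev
For example, on jobs $(0,3,5)$, $(2,5,6)$, $(4,7,4)$ this returns $9$, taking the first and third jobs.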
Bellman-Ford Algorithm for Shortest Path
Problem: Given a directed graph $G=(V,E)$, a starting vertex $s\in V$, a destination vertex $t\in V$, and edge lengths $l_e=l_{uv}$ for all $e=(u,v)\in E$, find a path $P$ from $s$ to $t$ such that $\sum_{e\in E(P)}l_e$ is minimised.
Algorithm: To solve this problem, consider the following subproblems: For all $k\in[|V(G)|]$, what is the minimum length of a walk from $s$ to $v$ which uses at most $k$ edges? Let $d_k(v)$ be the minimum length of a walk from $s$ to $v$ which uses at most $k$ edges. We then have the following recurrence relation: $$d_{k+1}(v)=\min\{d_k(v),\min_{u\in V(G):(u,v)\in E(G)} (d_k(u)+l_{uv})\}$$
Proof of correctness: First we'll show that if there are no negative cycles in $G$, then for all $k\in\mathbb{N}$ and all $v\in V(G)$, $d_k(v)$ is also equal to the minimum length of a path from $s$ to $v$ which uses at most $k$ edges. Since all paths are walks, for any walk $W$ from $s$ to $v$ which uses at most $k$ edges, there is a path $P$ from $s$ to $v$ which uses at most $k$ edges with length less than or equal to length of $W$. We can turn $W$ into $P$ by removing all cycles from $W$. Since there are no negative length cycles in $G$, the length of $P$ is at most the length of $W$.
(LHS $\geq$ RHS) Let $W$ be a walk from $s$ to $v$ with minimum length which uses at most $k+1$ edges. If $W$ uses at most $k$ edges, then $W$ has a length of at least $d_k(v)$, so $d_{k+1}(v)\geq d_k(v)$. And if $W$ uses exactly $k+1$ edges with the final edge being $(u,v)$, then $W$ has length at least $d_k(u)+l_{uv}$, so $d_{k+1}(v)\geq\min_{u\in V(G):(u,v)\in E(G)}(d_k(u)+l_{uv})$.
(LHS $\leq$ RHS) By definition, there is a walk of length $d_k(v)$ from $s$ to $v$ which uses at most $k$ edges. As such, it uses at most $k+1$ edges, so $d_{k+1}(v)\leq d_k(v)$. Similarly, for all $u\in V(G)$, there is a walk $W$ of length $d_k(u)$ from $s$ to $u$ which uses at most $k$ edges. Adding the edge $(u,v)$ to this walk gives a walk from $s$ to $v$ of length $d_k(u)+l_{uv}$, which uses at most $k+1$ edges, so $d_{k+1}(v)\leq\min_{u\in V(G):(u,v)\in E(G)}(d_k(u)+l_{uv})$.
Alternative proof of correctness: We can partition the walks $W$ from $s$ to $v$ using at most $k+1$ edges based on the vertex immediately preceding $v$. Observe that any walk $W$ from $s$ to $v$ using at most $k+1$ edges must satisfy one of the following:
- $W$ uses at most $k$ edges. The shortest such walk has length $d_k(v)$.
- The vertex before $v$ in $W$ is $u$ for some $u\in V$ such that $(u,v)\in E(G)$. These walks consist of a walk $W'$ from $s$ to $u$ using at most $k$ edges with the edge $(u,v)$ added at the end. The shortest such walk has length $d_k(u)+l_{uv}$.
Runtime: Let $n=|V(G)|$ and let $m=|E(G)|$. Naively, there are $n^2$ subproblems $d_k(v)$ to compute and each $d_k(v)$ takes $O(n)$ time to compute. We can improve this by observing that each $d_k(v)$ takes $O(indegree(v))$ time to compute. Thus, for each $k\in[n]$, computing all of the $d_k(v)$ takes $O(m)$ time, since $\sum_{v\in V} indegree(v)=|E|=m$. Thus, this algorithm takes $O(mn)$ time.
Note: If there is a negative cycle in $G$ which is reachable from $s$, then there are walks of arbitrarily negative length to any vertex $v$ which is reachable from the negative cycle. Using the Bellman-Ford algorithm, we can check whether this happens by checking if there are any updates when we look at walks of length $n$. If there are no negative cycles reachable from $s$, then since all shortest paths in $G$ use at most $n-1$ edges, there will be no updates. Conversely, if there are no updates at a given $k$, then we have already found the shortest walks from $s$ to every vertex $v$ and we can terminate the algorithm. If there is a negative cycle reachable from $s$, there will be updates for all $k$.
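A Python sketch of the algorithm with the early-termination check described above; graph is assumed to map every vertex $u$ (including sinks) to a list of $(v, l_{uv})$ pairs, and no negative cycle is assumed reachable from $s$:
def bellman_ford(graph: dict[str, list[tuple[str, int]]], s: str) -> dict[str, float]:
    dist = {v: float('inf') for v in graph}  # dist[v] plays the role of d_k(v)
    dist[s] = 0
    for k in range(len(graph) - 1):          # shortest paths use at most |V|-1 edges
        updated = False
        for u in graph:
            for v, l in graph[u]:
                if dist[u] + l < dist[v]:    # relax edge (u, v)
                    dist[v] = dist[u] + l
                    updated = True
        if not updated:                      # no updates: all shortest walks found
            break
    return dist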
Knapsack Problem
Problem: Given $n$ objects with weights $w_i$ and values $v_i$ and a knapsack with capacity $C$, what is $\max_{I\subseteq[n]:\sum_{i\in I}w_i\leq C}(\sum_{i\in I}v_i)$, the maximum total value of objects which can be carried in the knapsack?
Algorithm: To solve this problem with integer weights and capacity, we consider the following subproblems: What is the maximum total value which can be taken from the first $k$ objects without exceeding weight $w$? Let $v(k,w)$ represent this value, where $v(k,w)=\max_{I\subseteq[k]:\sum_{i\in I}w_i\leq w}(\sum_{i\in I}v_i)$. Then we have the following recurrence relation (where the second term is omitted if $w_{k+1}>w$): $$v(k+1, w)=\max\{v(k,w), v(k, w-w_{k+1})+v_{k+1}\}$$
Proof of correctness: (LHS $\geq$ RHS) By definition, there is an $I\subseteq[k]$ such that $\sum_{i\in I}w_i\leq w$ and $\sum_{i\in I}v_i=v(k,w)$. Since $I\subseteq[k+1]$, we have that $v(k+1,w)\geq v(k,w)$. Also, there is an $I\subseteq[k]$ such that $\sum_{i\in I}w_i\leq w-w_{k+1}$ and $\sum_{i\in I}v_i=v(k, w-w_{k+1})$. Taking $I'=I\cup \{k+1\}$, we have that $\sum_{i\in I'}w_i\leq w$ and $\sum_{i\in I'}v_i=v(k,w-w_{k+1})+v_{k+1}$. Thus, $v(k+1,w)\geq v(k,w-w_{k+1})+v_{k+1}$.
(LHS $\leq$ RHS) By definition, there is an $I\subseteq[k+1]$ such that $\sum_{i\in I}w_i\leq w$ and $\sum_{i\in I}v_i=v(k+1,w)$. If $k+1\notin I$, then $I\subseteq[k]$, so $v(k+1,w)\leq v(k,w)$. If $k+1\in I$, then taking $I'=I\setminus\{k+1\}$, $\sum_{i\in I'}w_i\leq w-w_{k+1}$ and $\sum_{i\in I'}v_i=v(k+1,w)-v_{k+1}\leq v(k,w-w_{k+1})$, so $v(k+1,w)\leq v(k,w-w_{k+1})+v_{k+1}$.
Runtime: Though the input size is $O(n\log C)$, this algorithm runs in $O(Cn)$ time, which is not polynomial in the input size if $C$ is very large. Therefore, we say this algorithm runs in pseudo-polynomial time (and the problem is NP-hard).
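A Python sketch of the pseudo-polynomial DP, filling a table of the $v(k,w)$ values for integer weights and capacity:
def knapsack(weights: list[int], values: list[int], C: int) -> int:
    n = len(weights)
    # v[k][w] = maximum total value from the first k objects within weight w
    v = [[0] * (C + 1) for _ in range(n + 1)]
    for k in range(n):
        for w in range(C + 1):
            v[k + 1][w] = v[k][w]        # option 1: skip object k+1
            if weights[k] <= w:          # option 2: take object k+1 if it fits
                v[k + 1][w] = max(v[k + 1][w], v[k][w - weights[k]] + values[k])
    return v[n][C]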
Longest Common Subsequence
Problem: Given two strings $A=a_1a_2\cdots a_n$ and $B=b_1b_2\cdots b_m$, find a sequence of indices $I=(i_1,i_2,\cdots, i_l)$ and $J=(j_1,j_2,\cdots, j_l)$ such that:
- for all $k\in [2,l]$, $1\leq i_{k-1}<i_k\leq n$ and $1\leq j_{k-1}<j_k\leq m$ (the sequences of indices $I$ and $J$ are in increasing order),
- for all $k\in [l]$, $a_{i_k}=b_{j_k}$ (the subsequences of $A$ and $B$ with indices $I$ and $J$ are the same), and
- the length $l$ is maximised.
Algorithm: To solve this problem, consider the following subproblems: what is the longest common subsequence given the first $i$ letters of $A$ and the first $j$ letters of $B$? We define $S(i,j)$ to be the longest common subsequence in $A_i=a_1a_2\cdots a_i$ and $B_j=b_1b_2\cdots b_j$. Then we have the following recurrence relation: $$S(i,j)=\begin{cases} 0 &\text{if $i=0$ or $j=0$}\\ S(i-1,j-1)+1 &\text{if $a_i=b_j$}\\ \max\{S(i-1,j), S(i,j-1)\} &\text{if $a_i\neq b_j$} \end{cases}$$
Proof of correctness: If $a_i=b_j$, then it is always optimal to match up $a_i$ with $b_j$ and find the longest common subsequence in $A_{i-1}$ and $B_{j-1}$ (an exchange argument shows any common subsequence of $A_i$ and $B_j$ can be modified to match them without becoming shorter). On the other hand, if $a_i\neq b_j$, then we cannot use both $a_i$ and $b_j$. If we do not use $a_i$, then our subsequence will have length at most $S(i-1,j)$. If we do not use $b_j$, then our subsequence will have length at most $S(i,j-1)$. Thus, the longest common subsequence in $A_i$ and $B_j$ has length $\max\{S(i-1,j),S(i,j-1)\}$.
Runtime: There are $mn$ subproblems $S(i,j)$. Each subproblem takes $O(1)$ time, so this algorithm runs in $O(mn)$ time.
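A Python sketch of the recurrence, computing the table of $S(i,j)$ values (returning only the length; the subsequence itself can be recovered by tracing back through the table):
def lcs_length(A: str, B: str) -> int:
    n, m = len(A), len(B)
    # S[i][j] = length of the longest common subsequence of A_i and B_j
    S = [[0] * (m + 1) for _ in range(n + 1)]
    for i in range(1, n + 1):
        for j in range(1, m + 1):
            if A[i - 1] == B[j - 1]:              # a_i = b_j: match them up
                S[i][j] = S[i - 1][j - 1] + 1
            else:                                  # a_i != b_j: drop one of them
                S[i][j] = max(S[i - 1][j], S[i][j - 1])
    return S[n][m]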
Non-crossing Matchings
Problem: Given a graph $G$ with vertices $v_1,\cdots,v_n$, a non-crossing matching is a set of edges $M\subseteq E(G)$ such that if we arrange the vertices $v_1,\cdots,v_n$ clockwise on a circle and draw the edges as chords, no two edges cross or share an endpoint. Equivalently, for all pairs of edges $(v_i,v_j),(v_{i'},v_{j'})\in M$ where $i<j$ and $i'<j'$, neither $i<i'<j<j'$ nor $i'<i<j'<j$. Given this undirected graph, what is the largest non-crossing matching $M$?
Algorithm: To solve this problem, consider the following subproblems: For all $i<j\in[n]$, what is the size of the largest non-crossing matching $M$ containing only edges between the vertices $v_i,\cdots,v_j$? We define $M(i,j)$ to be the size of the largest non-crossing matching $M$ such that $M$ only contains edges between vertices $v_i,\cdots, v_j$. Then we have the following recurrence relation: $$M(i,j)=\max\{M(i,j-1), \max_{i':i\leq i'<j, (v_{i'},v_j)\in E(G)}(M(i,i'-1)+M(i'+1,j-1)+1)\}$$
Proof of correctness: Note that either $v_j$ is matched with a vertex $v_{i'}$, where $i'\in[i,j-1]$ and $(v_{i'},v_j)\in E(G)$, or $v_j$ is not matched with any of these vertices. In the second case, the largest non-crossing matching we can obtain has $M(i,j-1)$ edges. In the first case, the chord $(v_{i'},v_j)$ splits the remaining vertices into $v_i,\cdots,v_{i'-1}$ and $v_{i'+1},\cdots,v_{j-1}$ (no other edge may cross it), so the largest non-crossing matching we can obtain within the vertices $v_i,\cdots, v_j$ has $M(i,i'-1)+M(i'+1,j-1)+1$ edges. Thus, the largest matching we can obtain if $v_j$ is matched has $\max_{i':i\leq i'<j, (v_{i'},v_j)\in E(G)}(M(i,i'-1)+M(i'+1,j-1)+1)$ edges.
Runtime: There are $n^2$ subproblems $M(i,j)$, each of which takes $O(n)$ time to compute. As such, the total running time is $O(n^3)$.
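A Python sketch of the recurrence using memoisation; vertices are numbered $1,\dots,n$, and edges is assumed to be a set of $(i,j)$ pairs with $i<j$:
from functools import lru_cache

def largest_noncrossing_matching(n: int, edges: set[tuple[int, int]]) -> int:
    @lru_cache(maxsize=None)
    def M(i: int, j: int) -> int:
        if i >= j:
            return 0                    # fewer than two vertices: no edges possible
        best = M(i, j - 1)              # case: v_j is unmatched
        for ip in range(i, j):          # case: v_j is matched with v_{i'}
            if (ip, j) in edges:
                best = max(best, M(i, ip - 1) + M(ip + 1, j - 1) + 1)
        return best
    return M(1, n)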