Question No: 9
Context Size: 17199

Codebase:

File: matrix_search.py:

```Python
from typing import List, Tuple
from typing import List
from typing import Dict, List
import numpy as np
from typing import Dict
import re

def pathfinder(grid: List[List[int]], start: Tuple[int, int], end: Tuple[int, int]) -> List[Tuple[int, int]]:
    directions = [(0, 1), (0, -1), (1, 0), (-1, 0)]
    queue = [(start, [start])]
    
    while queue:
        (x, y), path = queue.pop(0)
        if (x, y) == end:
            return path
        for dx, dy in directions:
            nx, ny = x + dx, y + dy
            if 0 <= nx < len(grid) and 0 <= ny < len(grid[0]) and grid[nx][ny] == 1 and (nx, ny) not in path:
                queue.append(((nx, ny), path + [(nx, ny)]))
    
    return None

def shortest_concatenated_string(strings: List[str], max_length: int, target_string: str) -> str:
    concatenated_string = ""
    
    for string in strings:
        if target_string in string and len(concatenated_string) + len(string) <= max_length:
            concatenated_string += string
            break
        elif len(concatenated_string) + len(string) <= max_length:
            concatenated_string += string
    
    return concatenated_string

def search_matrix(matrix: List[List[int]], target: int) -> Tuple[int, int]:
    if not matrix or not matrix[0]:
        return -1, -1
    
    rows, cols = len(matrix), len(matrix[0])
    row, col = 0, cols - 1
    
    while row < rows and col >= 0:
        current = matrix[row][col]
        if current == target:
            return row, col
        elif current > target:
            col -= 1  # Move left
        else:
            row += 1  # Move down
    
    return -1, -1  # Target not found

def lowest_common_ancestor(tree: Dict[int, List[int]], root: int) -> int:
    ancestors = set()
    stack = [root]
    
    while stack:
        node = stack.pop()
        ancestors.add(node)
        
        for child in tree.get(node, []):
            stack.append(child)
    
    lca = root
    
    for node in ancestors:
        if all(node in ancestors for child in tree.get(node, [])):
            lca = node
    
    return lca

def schedule_jobs(jobs: List[Tuple[int, int]], processors: int) -> int:
    jobs.sort(key=lambda job: job[1])
    processors_load = [0] * processors
    max_lateness = 0
    
    for job in jobs:
        processing_time, deadline = job
        min_load = min(processors_load)
        processor = processors_load.index(min_load)
        
        if processors_load[processor] + processing_time <= deadline:
            processors_load[processor] += processing_time
        else:
            processors_load[processor] += processing_time
            max_lateness = max(max_lateness, processors_load[processor] - deadline)
    
    return max_lateness

def eigenvalue_decomposition(matrix: List[List[float]]) -> List[Tuple[float, List[float]]]:
    numpy_matrix = np.array(matrix)
    eigenvalues, eigenvectors = np.linalg.eig(numpy_matrix)
    
    result = []
    for eigenvalue, eigenvector in zip(eigenvalues, eigenvectors.T):
        result.append((eigenvalue, eigenvector.tolist()))
    
    return result

def longest_subsequence_sum(sequence: List[int], target: int) -> List[int]:
    if not sequence or target == 0:
        return []
    
    num_elements = len(sequence)
    dp = [[0] * (target + 1) for _ in range(num_elements + 1)]
    max_length = 0
    max_ending_index = 0
    
    for i in range(1, num_elements + 1):
        for j in range(1, target + 1):
            if sequence[i - 1] > j:
                dp[i][j] = dp[i - 1][j]
            else:
                dp[i][j] = max(dp[i - 1][j], dp[i - 1][j - sequence[i - 1]] + 1)
            if dp[i][j] > max_length:
                max_length = dp[i][j]
                max_ending_index = i
    
    subsequence = []
    current_index = max_ending_index
    current_target = target
    while current_index > 0 and current_target > 0:
        if dp[current_index][current_target] != dp[current_index - 1][current_target]:
            subsequence.append(sequence[current_index - 1])
            current_target -= sequence[current_index - 1]
        current_index -= 1
    
    subsequence.reverse()
    return subsequence

def find_substrings(text: str, max_length: int) -> List[str]:
    substrings = set()
    
    for length in range(1, max_length + 1):
        for start in range(len(text) - length + 1):
            substrings.add(text[start:start + length])
    
    return sorted(list(substrings))

def lca_queries(tree: List[List[int]], queries: List[List[int]]) -> List[int]:
    n = len(tree)
    lca = [[0] * n for _ in range(n)]
    
    for i in range(n):
        for j in range(n):
            if i == j:
                lca[i][j] = i
            elif j in tree[i]:
                lca[i][j] = i
                lca[j][i] = i
            else:
                for neighbor in tree[i]:
                    if neighbor != j and lca[neighbor][j] != 0:
                        lca[i][j] = lca[neighbor][j]
                        lca[j][i] = lca[i][j]
    
    results = []
    for query in queries:
        results.append(lca[query[0]][query[1]])
    
    return results

def extract_word_frequencies(text: str, min_length: int) -> Dict[str, int]:
    words = re.findall(r'\b\w{%d,}\b' % min_length, text.lower())
    frequency = {}
    
    for word in words:
        frequency[word] = frequency.get(word, 0) + 1
    
    return frequency

def find_smallest_element(array, rotations):
    low, high = 0, len(array) - 1
    
    while low < high:
        mid = (low + high) // 2
        if array[mid] > array[high]:
            low = mid + 1
        else:
            high = mid
    
    return low
```

File: median_subgraph.py:

```Python
from typing import List, Optional
from typing import List
from collections import deque
import heapq
import numpy as np
from sklearn.cluster import KMeans
from sklearn.metrics import silhouette_score
from typing import List, Tuple
from typing import Dict

def calculate_moving_average(time_series: List[float], window_size: int) -> List[Optional[float]]:
    n = len(time_series)
    if window_size > n:
        return [None] * n
    
    moving_averages = [None] * n
    
    for i in range(n):
        if i >= window_size - 1:
            moving_average = sum(time_series[i - window_size + 1:i + 1]) / window_size
            moving_averages[i] = moving_average
            
    return moving_averages

def insert_interval(intervals: List[List[int]], new_interval: List[int]) -> List[List[int]]:
    if not intervals:
        return [new_interval]
    
    result = []
    i = 0
    
    while i < len(intervals) and intervals[i][1] < new_interval[0]:
        result.append(intervals[i])
        i += 1
    
    while i < len(intervals) and intervals[i][0] <= new_interval[1]:
        new_interval[0] = min(new_interval[0], intervals[i][0])
        new_interval[1] = max(new_interval[1], intervals[i][1])
        i += 1
    
    result.append(new_interval)
    
    while i < len(intervals):
        result.append(intervals[i])
        i += 1
    
    return result

def median_component(graph: List[List[int]], vertices: int) -> List[List[List[int]]]:
    total_distance = 0
    distance_matrix = [[float('inf')] * vertices for _ in range(vertices)]
    
    for i in range(vertices):
        distance_matrix[i][i] = 0
    
    for u, v in graph:
        distance_matrix[u][v] = distance_matrix[v][u] = 1
    
    for k in range(vertices):
        for i in range(vertices):
            for j in range(vertices):
                distance_matrix[i][j] = min(distance_matrix[i][j], distance_matrix[i][k] + distance_matrix[k][j])
                total_distance += distance_matrix[i][j]
    
    median_distance = total_distance // (vertices * (vertices - 1) // 2)
    
    visited = [False] * vertices
    median_component = []
    subgraph1 = []
    subgraph2 = []
    
    for start in range(vertices):
        if not visited[start]:
            queue = deque([start])
            visited[start] = True
            subgraph = [start]
            
            while queue:
                node = queue.popleft()
                for neighbor, edge_length in enumerate(distance_matrix[node]):
                    if edge_length == median_distance and not visited[neighbor]:
                        queue.append(neighbor)
                        visited[neighbor] = True
                        subgraph.append(neighbor)
            
            median_component.append(subgraph)
            if len(subgraph) > len(median_component[0]):
                subgraph1 = median_component[0]
                median_component[0] = subgraph
            else:
                subgraph2 = subgraph
    
    return [subgraph1, subgraph2]

def schedule_jobs(schedule, k):
    # Create a priority queue to store available processors
    available_processors = []
    
    # Create a list to store the scheduled jobs
    scheduled_jobs = []
    
    for job in schedule:
        # If there are available processors, schedule the job on the processor with the earliest end time
        if available_processors:
            processor_end_time = heapq.heappop(available_processors)
            scheduled_jobs.append((processor_end_time[1], job))
            heapq.heappush(available_processors, (processor_end_time[0] + job, processor_end_time[1]))
        else:
            # If there are no available processors, schedule the job on a new processor
            scheduled_jobs.append((0, job))
            heapq.heappush(available_processors, (job, len(scheduled_jobs) - 1))
    
    # Return the scheduled jobs
    return scheduled_jobs

def sequence_clustering(sequences: List[List[int]], window_size: int) -> List[int]:
    # Preprocessing: Windowing and flattening the sequences
    windows = [sequence[i:i+window_size] for sequence in sequences for i in range(len(sequence) - window_size + 1)]
    windows = [np.array(window).flatten() for window in windows]
    
    # K-Means clustering with optimal number of clusters determined by Silhouette Coefficient
    silhouette_values = []
    for n_clusters in range(2, 10):
        kmeans = KMeans(n_clusters=n_clusters)
        cluster_labels = kmeans.fit_predict(windows)
        silhouette_avg = silhouette_score(windows, cluster_labels)
        silhouette_values.append(silhouette_avg)
    optimal_n_clusters = np.argmax(silhouette_values) + 2
    
    kmeans = KMeans(n_clusters=optimal_n_clusters)
    cluster_labels = kmeans.fit_predict(windows)
    return cluster_labels

def schedule_jobs(jobs: List[Tuple[int, int]], machines: int) -> List[List[Tuple[int, int]]]:
    pq = [(0, i) for i in range(machines)]
    heapq.heapify(pq)
    scheduled_jobs = [[] for _ in range(machines)]
    
    for job in sorted(jobs):
        _, machine_id = heapq.heappop(pq)
        scheduled_jobs[machine_id].append(job)
        heapq.heappush(pq, (job[1], machine_id))
    
    return scheduled_jobs

def average_top_k_scores(arr: List[int], k: int) -> float:
    if len(arr) < k:
        return 0.0
    
    unique_scores = sorted(set(arr), reverse=True)[:k]
    return sum(unique_scores) / len(unique_scores)

def identify_users_with_no_incoming_transactions(transactions: List[Tuple[int, int, int]], minimum_amount: int) -> List[int]:
    graph = {}
    users_with_no_incoming_transactions = set()
    
    for sender, receiver, amount in transactions:
        if amount < minimum_amount:
            continue
        
        if receiver not in graph:
            graph[receiver] = []
        graph[receiver].append(sender)
        
        if sender not in graph:
            graph[sender] = []
    
    for user in graph:
        if user not in [sender for sender in graph.values() for sender in sender]:
            users_with_no_incoming_transactions.add(user)
    
    return list(users_with_no_incoming_transactions)

def maze_solver(grid: List[List[int]], start: Tuple[int, int], end: Tuple[int, int]) -> List[Tuple[int, int]]:
    directions = [(0, 1), (0, -1), (1, 0), (-1, 0)]
    visited = set()
    stack = [(start, [start])]
    
    while stack:
        (x, y), path = stack.pop()
        if (x, y) == end:
            return path
        if (x, y) in visited:
            continue
        visited.add((x, y))
        for dx, dy in directions:
            nx, ny = x + dx, y + dy
            if (0 <= nx < len(grid) and 0 <= ny < len(grid[0]) and
                grid[nx][ny] == 0 and (nx, ny) not in visited):
                stack.append(((nx, ny), path + [(nx, ny)]))
    
    return []

def kmer_frequencies(sequence: str, k: int) -> Dict[str, int]:
    kmer_freq = {}
    
    for i in range(len(sequence) - k + 1):
        kmer = sequence[i:i+k]
        if kmer in kmer_freq:
            kmer_freq[kmer] += 1
        else:
            kmer_freq[kmer] = 1
    
    return kmer_freq

def stone_game(stones: List[int]) -> int:
    total_weight = sum(stones)
    n = len(stones)
    dp = [[False] * (total_weight // 2 + 1) for _ in range(n + 1)]
    
    dp[0][0] = True
    
    for i in range(1, n + 1):
        weight = stones[i - 1]
        for j in range(total_weight // 2, -1, -1):
            if j < weight:
                dp[i][j] = dp[i - 1][j]
            else:
                dp[i][j] = dp[i - 1][j] or dp[i - 1][j - weight]
                
    max_diff = 0
    for i in range(total_weight // 2, -1, -1):
        if dp[n][i]:
            max_diff = total_weight - 2 * i
            break
            
    return max_diff
```

File: compression_algorithms.py:

```Python
from typing import List
import numpy as np
import random
import sympy as sp
import math
from typing import List, Tuple
from typing import Dict
from typing import Dict, List
from collections import defaultdict
import networkx as nx

def motif_discovery(sequences: List[List[int]], motif_length: int) -> List[int]:
    if not sequences or motif_length <= 0:
        return []
    
    num_sequences = len(sequences)
    sequence_length = len(sequences[0])
    if motif_length > sequence_length:
        return []
    
    init_prob = 1 / (motif_length * num_sequences)
    motif_prob = [[init_prob] * motif_length for _ in range(num_sequences)]
    background_prob = [[1/4] * sequence_length for _ in range(num_sequences)]
    
    for _ in range(100):
        expected_values = [[0] * motif_length for _ in range(num_sequences)]
        for i in range(num_sequences):
            for j in range(sequence_length - motif_length + 1):
                for k in range(motif_length):
                    expected_values[i][k] += motif_prob[i][k] * background_prob[i][j + k]
        
        motif_prob = [[0] * motif_length for _ in range(num_sequences)]
        for i in range(num_sequences):
            for j in range(sequence_length - motif_length + 1):
                motif_prob[i][j % motif_length] += expected_values[i][j % motif_length]
        
        motif_prob = [[prob / sum(motif_prob[i]) for prob in motif_prob[i]] for i in range(num_sequences)]
    
    motif = []
    for i in range(motif_length):
        max_prob = 0
        max_sequence_index = -1
        for j in range(num_sequences):
            if motif_prob[j][i] > max_prob:
                max_prob = motif_prob[j][i]
                max_sequence_index = j
        motif.append(sequences[max_sequence_index][i])
    
    return motif

def newton_raphson_root_finder(expression, max_iterations):
    x = sp.symbols('x')
    f = sp.sympify(expression)
    f_prime = sp.diff(f, x)
    
    x_value = 1.0
    for i in range(max_iterations):
        x_next = x_value - f.subs(x, x_value) / f_prime.subs(x, x_value)
        if abs(x_next - x_value) < 1e-6:
            break
        x_value = x_next
    
    return x_value, i + 1

def multiple_sequence_aligner(sequences: List[str], match_score: int, mismatch_score: int) -> List[str]:
    if len(sequences) == 0:
        return []
    
    # Initialize the score matrix
    score_matrix = [[0] * (len(sequences[0]) + 1) for _ in range(len(sequences))]
    
    # Initialize the alignment matrix
    alignment_matrix = [[[''] * (len(sequences[0]) + 1) for _ in range(len(sequences[0]) + 1)] for _ in range(len(sequences))]
    
    # Fill in the score matrix
    for i in range(len(sequences)):
        for j in range(len(sequences[0]) + 1):
            if j == 0:
                score_matrix[i][j] = 0
            else:
                score_matrix[i][j] = max(score_matrix[i-1][j-1] + (match_score if sequences[i][j-1] == sequences[0][j-1] else mismatch_score),
                                        score_matrix[i-1][j] + mismatch_score,
                                        score_matrix[i][j-1] + mismatch_score)
    
    # Fill in the alignment matrix
    for i in range(len(sequences)):
        for j in range(len(sequences[0]) + 1):
            if j == 0:
                alignment_matrix[i][j][0] = sequences[i][0:j]
            else:
                alignment_matrix[i][j][0] = sequences[i][0:j-1]
                if sequences[i][j-1] == sequences[0][j-1]:
                    alignment_matrix[i][j][0] += sequences[0][j-1]
                else:
                    alignment_matrix[i][j][0] += '-'
    
    # Reconstruct the aligned sequences
    aligned_sequences = []
    for i in range(len(sequences)):
        aligned_sequence = ''
        for j in range(len(sequences[0])):
            if sequences[i][j] == sequences[0][j]:
                aligned_sequence += sequences[0][j]
            else:
                aligned_sequence += '-'
        aligned_sequences.append(aligned_sequence)
    
    return aligned_sequences

def close_point_midpoints(points: List[List[int]], distance_threshold: int) -> List[List[float]]:
    result = []
    for i in range(len(points)):
        for j in range(i + 1, len(points)):
            distance = math.sqrt((points[i][0] - points[j][0])**2 + (points[i][1] - points[j][1])**2)
            if distance <= distance_threshold:
                midpoint = [(points[i][0] + points[j][0]) / 2, (points[i][1] + points[j][1]) / 2]
                result.append(midpoint)
    
    return result

def keyword_analysis(text: str, keyword: str) -> Tuple[int, List[str]]:
    sentences = text.split('.')
    count = 0
    sentences_with_keyword = []
    
    for sentence in sentences:
        if keyword.lower() in sentence.lower():
            count += sentence.lower().count(keyword.lower())
            sentences_with_keyword.append(sentence.strip())
    
    return count, sentences_with_keyword

def kernighan_lin_partitioning(adjacency_matrix: np.ndarray, num_partitions: int) -> np.ndarray:
    num_vertices, _ = adjacency_matrix.shape
    partition = np.random.randint(0, num_partitions, num_vertices)
    cut_size = np.sum(adjacency_matrix[partition == 0, :] @ (partition == 1))
    for _ in range(100):
        swap_vertices = np.random.choice(num_vertices, size=2, replace=False)
        old_cut = np.sum(adjacency_matrix[partition == 0, :] @ (partition == 1))
        partition[swap_vertices] = (partition[swap_vertices] + 1) % num_partitions
        new_cut = np.sum(adjacency_matrix[partition == 0, :] @ (partition == 1))
        if new_cut > old_cut:
            partition[swap_vertices] = (partition[swap_vertices] - 1) % num_partitions
    return partition

def decode_variable_length_codes(binary_string: str, codes: Dict[str, str]) -> str:
    decoded_string = ""
    temp = ""
    
    for bit in binary_string:
        temp += bit
        if temp in codes:
            decoded_string += codes[temp]
            temp = ""
    
    if temp:  # If the binary string is not a valid code
        raise ValueError("Invalid binary string")
    
    return decoded_string

def is_sub_matrix_sum(matrix: List[List[int]], target: int) -> bool:
    rows, cols = len(matrix), len(matrix[0])
    prefix_sum = [[0] * (cols + 1) for _ in range(rows + 1)]
    
    for i in range(1, rows + 1):
        for j in range(1, cols + 1):
            prefix_sum[i][j] = prefix_sum[i-1][j] + prefix_sum[i][j-1] - prefix_sum[i-1][j-1] + matrix[i-1][j-1]
    
    for i in range(1, rows + 1):
        for j in range(1, cols + 1):
            for k in range(i, rows + 1):
                for end_col in range(j, cols + 1):
                    sub_matrix_sum = prefix_sum[k][end_col] - prefix_sum[k][j-1] - prefix_sum[i-1][end_col] + prefix_sum[i-1][j-1]
                    if sub_matrix_sum == target:
                        return True
    
    return False

def depth_first_search(tree: List[List[int]], node: int) -> List[int]:
    visited = []
    stack = [node]
    
    while stack:
        current_node = stack.pop()
        if current_node not in visited:
            visited.append(current_node)
            for child in reversed(tree[current_node]):
                stack.append(child)
    
    return visited

def betweenness_centrality(graph: Dict[int, List[int]], k: int) -> List[int]:
    G = nx.Graph()
    for node, neighbors in graph.items():
        G.add_node(node)
        for neighbor in neighbors:
            G.add_edge(node, neighbor)
    
    centrality = nx.betweenness_centrality(G)
    sorted_centralities = sorted(centrality.items(), key=lambda x: x[1], reverse=True)
    return [node for node, _ in sorted_centralities[:k]]

def longest_common_subsequence(matrix: list) -> list:
    rows, cols = len(matrix), len(matrix[0])
    dp = [[0] * (cols + 1) for _ in range(rows + 1)]
    lcs = []
    
    for i in range(1, rows + 1):
        for j in range(1, cols + 1):
            if matrix[i - 1][j - 1] in matrix[:i - 1]:
                k = matrix[:i - 1].index(matrix[i - 1][j - 1])
                dp[i][j] = dp[k][j - 1] + 1
            else:
                dp[i][j] = dp[i - 1][j]
    
    i, j = rows, cols
    while i > 0 and j > 0:
        if dp[i][j] != dp[i - 1][j]:
            lcs.append(matrix[i - 1][j - 1])
            i = matrix[:i - 1].index(matrix[i - 1][j - 1])
            j -= 1
        else:
            i -= 1
    
    return lcs[::-1]
```

File: string_optimizer.py:

```Python
from typing import List, Tuple
from typing import List
import numpy as np
import heapq
from collections import defaultdict
from typing import List, Tuple, Dict
import pandas as pd
from sklearn.decomposition import PCA
from sklearn.linear_model import LinearRegression
from sklearn.model_selection import train_test_split
from itertools import combinations

def largest_subgrid(matrix: List[List[int]], threshold: int) -> Tuple[Tuple[int, int], Tuple[int, int]]:
    rows, cols = len(matrix), len(matrix[0])
    dp = [[0] * cols for _ in range(rows)]
    max_size = 0
    max_coords = ((0, 0), (0, 0))
    
    for i in range(rows):
        for j in range(cols):
            if matrix[i][j] > threshold:
                dp[i][j] = 1
                if i > 0 and j > 0:
                    dp[i][j] = min(dp[i-1][j], dp[i][j-1], dp[i-1][j-1]) + 1
                if dp[i][j] > max_size:
                    max_size = dp[i][j]
                    max_coords = ((i - max_size + 1, j - max_size + 1), (i, j))
    
    return max_coords

def gaussian_elimination_solver(matrix: List[List[float]], vector: List[float]) -> List[float]:
    matrix = np.array(matrix, dtype=float)
    vector = np.array(vector, dtype=float)
    
    n = len(matrix)
    
    for i in range(n):
        # Partial pivoting
        max_el = abs(matrix[i][i])
        max_row = i
        for k in range(i+1, n):
            if abs(matrix[k][i]) > max_el:
                max_el = abs(matrix[k][i])
                max_row = k
        
        # Swap maximum row with current row
        matrix[[i, max_row]] = matrix[[max_row, i]]
        vector[[i, max_row]] = vector[[max_row, i]]
        
        # Make all rows below this one 0 in current column
        for k in range(i+1, n):
            c = -matrix[k][i]/matrix[i][i]
            for j in range(i, n):
                if i == j:
                    matrix[k][j] = 0
                else:
                    matrix[k][j] += c * matrix[i][j]
            vector[k] += c * vector[i]
    
    # Solve equation Ax=b for an upper triangular matrix A
    solution = [0 for _ in range(n)]
    for i in range(n-1, -1, -1):
        solution[i] = vector[i]/matrix[i][i]
        for k in range(i-1, -1, -1):
            vector[k] -= matrix[k][i] * solution[i]
    
    return solution

def lexicographically_smallest_string(string: str, k: int) -> str:
    char_count = {}
    
    for char in string:
        if char in char_count:
            char_count[char] += 1
        else:
            char_count[char] = 1
    
    max_heap = []
    
    for char, count in char_count.items():
        heapq.heappush(max_heap, (-ord(char), char, count))
    
    while k > 0 and max_heap:
        _, char, count = heapq.heappop(max_heap)
        
        if count <= k:
            k -= count
        else:
            char_count[char] -= k
            k = 0
    
    result = ""
    
    for char in sorted(char_count.keys()):
        result += char * char_count[char]
    
    return result

def anagram_substrings(s: str, n: int) -> List[str]:
    anagrams = defaultdict(list)
    for i in range(len(s) - n + 1):
        sorted_str = "".join(sorted(s[i:i + n]))
        anagrams[sorted_str].append(s[i:i + n])
        
    result = []
    for value in anagrams.values():
        if len(value) > 1:
            result.extend(value)
            
    return result

def event_scheduler(intervals, events):
    intervals.sort()
    events.sort(key=lambda x: x[0])
    scheduled_events = []
    
    for event in events:
        for interval in intervals:
            if interval[0] <= event[0] and interval[1] >= event[1]:
                scheduled_events.append(event)
                intervals.remove(interval)
                break
    
    return scheduled_events

def budget_tracker(transactions: List[Tuple[str, int, str]], budget: int) -> List[str]:
    categories = {}
    
    for date, amount, description in transactions:
        category = description.split(':')[0].strip()
        if category in categories:
            categories[category] += amount
        else:
            categories[category] = amount
    
    exceeded_categories = [category for category, amount in categories.items() if amount > budget]
    
    return exceeded_categories

def pca_linear_regression(df: pd.DataFrame, feature_columns: List[str], target_column: str) -> List[float]:
    X = df[feature_columns]
    y = df[target_column]
    
    pca = PCA(n_components=0.95)
    X_pca = pca.fit_transform(X)
    
    X_train, X_test, y_train, y_test = train_test_split(X_pca, y, test_size=0.2, random_state=42)
    
    model = LinearRegression()
    model.fit(X_train, y_train)
    
    predicted_values = model.predict(X_test)
    
    return predicted_values.tolist()

def schedule_non_overlapping_tasks(m, time_slots):
    time_slots.sort(key=lambda x: x[1])  # Sort by end time
    selected_slots = []
    last_end = -1
    
    for start, end in time_slots:
        if start >= last_end:
            selected_slots.append((start, end))
            last_end = end
            
    return selected_slots

def apply_box_blur(matrix: List[List[int]]) -> List[List[int]]:
    blurred_matrix = [[0 for _ in range(len(matrix[0]))] for _ in range(len(matrix))]
    
    for i in range(len(matrix)):
        for j in range(len(matrix[0])):
            total = 0
            count = 0
            for x in range(max(0, i-1), min(len(matrix), i+2)):
                for y in range(max(0, j-1), min(len(matrix[0]), j+2)):
                    total += matrix[x][y]
                    count += 1
            blurred_matrix[i][j] = total // count
    
    return blurred_matrix

def list_intersection(A: List[int], B: List[int]) -> List[int]:
    set_B = set(B)
    result = []
    for a in A:
        if a in set_B:
            result.append(a)
            set_B.remove(a)
    
    return result

def find_sequence_pairs(sequences: List[List[int]], target_sum: int) -> List[Tuple[int, int]]:
    sequence_sums = [sum(seq) for seq in sequences]
    pairs = set()
    for i, j in combinations(range(len(sequences)), 2):
        if sequence_sums[i] + sequence_sums[j] == target_sum:
            pairs.add(tuple(sorted((i, j))))
    return list(pairs)
```

File: min_bit_flips.py:

```Python
import numpy as np
from typing import List
from typing import Dict, List
from typing import List, Tuple
from typing import List, Dict
import math

def reduce_rank_with_svd(matrix: np.ndarray, k: int) -> np.ndarray:
    if k >= matrix.shape[1]:
        return matrix
    
    U, s, Vh = np.linalg.svd(matrix)
    Uk = U[:, :k]
    sk = np.diag(s[:k])
    Vk = Vh[:k, :]
    
    return Uk @ sk @ Vk

def max_subarray_sums(sequence: List[int], window_size: int) -> List[int]:
    if not sequence or window_size <= 0:
        return []
    
    max_sums = []
    current_sum = sum(sequence[:window_size])
    max_sums.append(current_sum)
    
    for i in range(window_size, len(sequence)):
        current_sum = current_sum - sequence[i - window_size] + sequence[i]
        max_sums.append(max(max_sums[-1], current_sum))
    
    return max_sums

def max_score_with_moves(matrix: List[List[int]], k: int) -> int:
    if not matrix or k >= len(matrix) * len(matrix[0]):
        return 0
    
    rows, cols = len(matrix), len(matrix[0])
    dp = [[0] * cols for _ in range(rows)]
    dp[0][0] = matrix[0][0]
    
    for _ in range(k):
        temp = [[0] * cols for _ in range(rows)]
        for i in range(rows):
            for j in range(cols):
                for di, dj in [(-1, 0), (1, 0), (0, -1), (0, 1)]:
                    ni, nj = i + di, j + dj
                    if 0 <= ni < rows and 0 <= nj < cols:
                        temp[i][j] = max(temp[i][j], dp[ni][nj] + matrix[i][j])
        dp = temp
    
    return max(dp[-1])

def divide_graph_into_communities(graph: Dict[int, List[int]], communities: int) -> Dict[int, int]:
    node_community = {}
    community_sizes = [0] * communities
    
    for node in graph:
        max_neighbors = 0
        community = 0
        for neighbor in graph[node]:
            if neighbor in node_community:
                if community_sizes[node_community[neighbor]] > max_neighbors:
                    max_neighbors = community_sizes[node_community[neighbor]]
                    community = node_community[neighbor]
        if community == 0:
            community = 0
            for i in range(1, communities):
                if community_sizes[i] < community_sizes[community]:
                    community = i
        node_community[node] = community
        community_sizes[community] += 1
    
    return node_community

def transform_string_case(string, transformations):
    if not string or not transformations:
        return string
    
    result = list(string)
    
    for transformation in transformations:
        if transformation == "upper":
            result = [char.upper() for char in result]
        elif transformation == "lower":
            result = [char.lower() for char in result]
    
    return "".join(result)

def find_pattern(strings: List[str], pattern: str) -> List[Tuple[int, int]]:
    result = []
    for i, string in enumerate(strings):
        dp = [[False] * (len(pattern) + 1) for _ in range(len(string) + 1)]
        dp[0][0] = True
        for j in range(1, len(pattern) + 1):
            if pattern[j-1] == '*':
                dp[0][j] = dp[0][j-1]
        
        for i in range(1, len(string) + 1):
            for j in range(1, len(pattern) + 1):
                if pattern[j-1] in {string[i-1], '?'}:
                    dp[i][j] = dp[i-1][j-1]
                elif pattern[j-1] == '*':
                    dp[i][j] = dp[i][j-1] or dp[i-1][j]
        
        for i in range(1, len(string) + 1):
            if dp[i][len(pattern)]:
                result.append((i-1, i-len(pattern)))
    
    return result

def is_prime(n: int) -> bool:
    if n <= 1:
        return False
    if n <= 3:
        return True
    if n % 2 == 0 or n % 3 == 0:
        return False
    i = 5
    while i * i <= n:
        if n % i == 0 or n % (i + 2) == 0:
            return False
        i += 6
    return True

def longest_increasing_subsequence(sequence: List[int]) -> int:
    if not sequence:
        return 0
    
    lis = [1] * len(sequence)  # Initialize LIS array
    
    for i in range(1, len(sequence)):
        for j in range(i):
            if sequence[i] > sequence[j]:
                lis[i] = max(lis[i], lis[j] + 1)
    
    return max(lis)

def min_bit_flips(bitstrings: List[str], target: str) -> (int, str):
    min_flips = float('inf')
    min_bitstring = ''
    
    for bitstring in bitstrings:
        flips = sum(el1 != el2 for el1, el2 in zip(bitstring, target))
        if flips < min_flips:
            min_flips = flips
            min_bitstring = bitstring
    
    return min_flips, min_bitstring

def evaluate_students(students: List[List[int]], threshold: int) -> Dict[int, str]:
    results = {}
    for i, student in enumerate(students):
        average_grade = sum(student) / len(student)
        if average_grade >= threshold:
            results[i] = "Pass"
        else:
            results[i] = "Fail"
    return results

def points_in_circle(points: List[Tuple[float, float]], r: float) -> List[Tuple[float, float]]:
    return [(x, y) for x, y in points if math.sqrt(x**2 + y**2) <= r]
```

File: binomial_coefficient.py:

```Python
from typing import List, Dict
from typing import List
import numpy as np
from typing import List, Tuple
from itertools import groupby
from collections import deque
import math

def find_overlapping_subsequences(sequences: List[str], min_length: int) -> Dict[str, int]:
    subsequences = {}
    
    for sequence in sequences:
        for i in range(len(sequence) - min_length + 1):
            subsequence = sequence[i:i + min_length]
            subsequences[subsequence] = subsequences.get(subsequence, 0) + 1
    
    return subsequences

def binomial_coefficient_calculator(n: int, m: int, k: int) -> List[List[int]]:
    coefficients = [[0] * (k + 1) for _ in range(m + 1)]
    
    for i in range(m + 1):
        coefficients[i][0] = 1
        coefficients[i][min(i, k)] = 1
    
    for i in range(1, m + 1):
        for j in range(1, min(i, k) + 1):
            coefficients[i][j] = coefficients[i - 1][j - 1] + coefficients[i - 1][j]
    
    return coefficients

def power_iteration(matrix: List[List[float]], k: int) -> List[float]:
    eigenvalues = []
    eigenvectors = []
    
    for _ in range(k):
        # Initialize a random vector
        vector = np.random.rand(len(matrix))
        
        # Normalize the vector
        vector /= np.linalg.norm(vector)
        
        # Perform power iteration
        for _ in range(100):
            vector = np.dot(matrix, vector)
            vector /= np.linalg.norm(vector)
        
        # Append the eigenvalue and eigenvector
        eigenvalues.append(np.dot(vector, np.dot(matrix, vector)) / np.dot(vector, vector))
        eigenvectors.append(vector)
        
        # Orthogonalize the vector using Gram-Schmidt process
        for i in range(len(eigenvalues) - 1):
            vector -= np.dot(eigenvectors[i], vector) * eigenvectors[i]
        vector /= np.linalg.norm(vector)
    
    return eigenvalues, eigenvectors

def markov_chain_simulator(matrix: List[List[float]], initial_state: List[float], steps: int) -> List[float]:
    state_probabilities = initial_state
    
    for _ in range(steps):
        state_probabilities = [sum([state_probabilities[j] * matrix[j][i] for j in range(len(state_probabilities))]) for i in range(len(state_probabilities))]
    
    return state_probabilities

def otsu_thresholding(image: List[List[int]], threshold: int) -> List[List[int]]:
    histogram = np.histogram(image, bins=256, range=(0, 256))[0]
    total_pixels = sum(histogram)
    
    sum_background = 0
    sum_foreground = sum(i * histogram[i] for i in range(256))
    count_background = 0
    count_foreground = total_pixels
    
    max_variance = 0
    optimal_threshold = 0
    for i in range(1, 256):
        count_background += histogram[i - 1]
        count_foreground -= histogram[i - 1]
        sum_background += (i - 1) * histogram[i - 1]
        sum_foreground -= i * histogram[i - 1]
        
        mean_background = sum_background / count_background
        mean_foreground = sum_foreground / count_foreground
        
        variance = count_background * count_foreground * (mean_background - mean_foreground) ** 2
        
        if variance > max_variance:
            max_variance = variance
            optimal_threshold = i
    
    segmented_image = [[1 if pixel > optimal_threshold else 0 for pixel in row] for row in image]
    
    return segmented_image

def stratified_random_sampling(population: List[int], sample_size: int) -> List[int]:
    population_array = np.array(population)
    quantiles = np.quantile(population_array, [0, 0.25, 0.5, 0.75, 1])
    sample = []
    
    for i in range(4):
        stratum = population_array[(population_array > quantiles[i]) & (population_array <= quantiles[i + 1])]
        stratum_sample_size = int(sample_size * len(stratum) / len(population))
        stratum_sample = np.random.choice(stratum, size=stratum_sample_size, replace=False)
        sample.extend(stratum_sample)
    
    return sample

def split_string(string: str) -> List[Tuple[str, str]]:
    groups = []
    for key, group in groupby(string, str.isdigit):
        groups.append(''.join(group))
    
    splits = []
    for i in range(len(groups)):
        if groups[i].isdigit():
            splits.append((groups[i], ''))
        else:
            splits.append((''.join(groups[:i]), groups[i]))
            splits.append((groups[i], ''.join(groups[i+1:])))
    
    return splits

def ngram_extraction(text: str, ngrams: int) -> List[List[str]]:
    words = text.split()
    padded_words = ['<SOS>'] * (ngrams - 1) + words + ['<EOS>'] * (ngrams - 1)
    
    ngrams_list = []
    for i in range(len(padded_words) - ngrams + 1):
        ngram = padded_words[i:i + ngrams]
        ngrams_list.append(ngram)
    
    return ngrams_list

def reachable_positions(grid: List[List[int]], k: int) -> List[tuple]:
    rows, cols = len(grid), len(grid[0])
    directions = [(0, 1), (0, -1), (1, 0), (-1, 0)]
    visited = set()
    queue = deque([(0, 0, 0)])  # (row, col, steps)
    reachable = []
    
    while queue:
        row, col, steps = queue.popleft()
        
        if steps > k:
            break
        
        if (row, col) not in visited:
            visited.add((row, col))
            reachable.append((row, col))
            
            for dr, dc in directions:
                r, c = row + dr, col + dc
                
                if 0 <= r < rows and 0 <= c < cols:
                    queue.append((r, c, steps + 1))
    
    return reachable

def find_k_nearest_points(points: List[Tuple[float, float]], k: int) -> List[Tuple[float, float]]:
    distances = [(math.sqrt(x**2 + y**2), (x, y)) for x, y in points]
    sorted_points = sorted(distances, key=lambda item: item[0])
    return [point[1] for point in sorted_points[:k]]

def trend_analysis(prices: List[float], n: int) -> Dict[str, int]:
    if len(prices) < n:
        return {"increasing": 0, "decreasing": 0, "stable": 0}
    
    trends = {"increasing": 0, "decreasing": 0, "stable": 0}
    
    for i in range(len(prices) - n):
        change = prices[i + n] - prices[i]
        if change > 0:
            trends["increasing"] += 1
        elif change < 0:
            trends["decreasing"] += 1
        else:
            trends["stable"] += 1
            
    return trends
```

File: string_operations.py:

```Python
from typing import Dict, List
from typing import List
from collections import deque
import random
from typing import List, Tuple
from sklearn.cluster import DBSCAN

def is_graph_traversable(graph: Dict[int, List[int]], start_node: int, visit_order: List[int]) -> bool:
    visited = set()
    for node in visit_order:
        if node not in graph:
            return False
        if node != start_node and node not in visited:
            return False
        for neighbor in graph[node]:
            if neighbor not in visited and neighbor != start_node:
                return False
        visited.add(node)
    return len(visited) == len(graph)

def rotate_sub_matrix(matrix: List[List[int]], row: int, col: int, size: int) -> List[List[int]]:
    if not matrix or size <= 0:
        return matrix
    
    for _ in range(4):
        for layer in range(size // 2):
            first, last = layer, size - layer - 1
            
            for i in range(first, last):
                top = matrix[layer + row][i + col]
                
                matrix[layer + row][i + col] = matrix[-i - 1 + row + size - 1][layer + col]
                matrix[-i - 1 + row + size - 1][layer + col] = matrix[-layer - 1 + row + size - 1][-i - 1 + col + size - 1]
                matrix[-layer - 1 + row + size - 1][-i - 1 + col + size - 1] = matrix[i + row][last + col]
                matrix[i + row][last + col] = top
                
    return matrix

def shortest_path_to_boundary(grid: List[List[int]], x: int, y: int) -> int:
    n, m = len(grid), len(grid[0])
    if x < 0 or x >= n or y < 0 or y >= m:
        raise ValueError("Cell is out of bounds")
    
    directions = [(0, 1), (0, -1), (1, 0), (-1, 0)]
    queue = deque([(x, y, 0)])
    visited = {(x, y)}
    
    while queue:
        current_x, current_y, distance = queue.popleft()
        
        if current_x == 0 or current_x == n-1 or current_y == 0 or current_y == m-1:
            return distance
        
        for dx, dy in directions:
            new_x, new_y = current_x + dx, current_y + dy
            
            if 0 <= new_x < n and 0 <= new_y < m and (new_x, new_y) not in visited:
                queue.append((new_x, new_y, distance + 1))
                visited.add((new_x, new_y))
    
    return -1

def rotate_string(s, n):
    n = n % len(s) if s else 0
    return s[n:] + s[:n]

def knapsack(items: List[List[int]], capacity: int) -> List[int]:
    n = len(items)
    dp = [[0] * (capacity + 1) for _ in range(n + 1)]
    
    for i in range(1, n + 1):
        weight, value = items[i - 1]
        
        for j in range(1, capacity + 1):
            if weight > j:
                dp[i][j] = dp[i - 1][j]
            else:
                dp[i][j] = max(dp[i - 1][j], dp[i - 1][j - weight] + value)
    
    selected_items = []
    i, j = n, capacity
    
    while i > 0 and j > 0:
        if dp[i][j] != dp[i - 1][j]:
            selected_items.append(i - 1)
            j -= items[i - 1][0]
        i -= 1
    
    return selected_items

def maximum_sum_path(triangle: List[List[int]]) -> List[int]:
    rows = len(triangle)
    dp = [[0] * len(row) for row in triangle]
    dp[0][0] = triangle[0][0]
    
    for i in range(1, rows):
        for j in range(len(triangle[i])):
            if j == 0:
                dp[i][j] = dp[i - 1][j] + triangle[i][j]
            elif j == len(triangle[i]) - 1:
                dp[i][j] = dp[i - 1][j - 1] + triangle[i][j]
            else:
                dp[i][j] = max(dp[i - 1][j - 1], dp[i - 1][j]) + triangle[i][j]
    
    max_sum = max(dp[-1])
    max_index = dp[-1].index(max_sum)
    max_path = [max_sum]
    for i in range(rows - 2, -1, -1):
        if max_index == 0:
            max_path.insert(0, dp[i][max_index])
            max_index = max_index
        elif max_index == len(triangle[i]) - 1:
            max_path.insert(0, dp[i][max_index - 1])
            max_index = max_index - 1
        else:
            if dp[i][max_index - 1] > dp[i][max_index]:
                max_path.insert(0, dp[i][max_index - 1])
                max_index = max_index - 1
            else:
                max_path.insert(0, dp[i][max_index])
                max_index = max_index
    
    return max_path

def word_segmentation(text: str, dictionary: List[str]) -> str:
    n = len(text)
    dp = [False] * (n + 1)
    dp[0] = True
    
    for i in range(1, n + 1):
        for j in range(i):
            if dp[j] and text[j:i] in dictionary:
                dp[i] = True
                break
    
    i = n
    result = []
    
    while i > 0:
        for j in range(i):
            if dp[j] and text[j:i] in dictionary:
                result.append(text[j:i])
                i = j
                break
    
    return ' '.join(result[::-1])

def knapsack_solver(items: List[str], capacity: int, profits: List[int]) -> List[str]:
    n = len(profits)
    dp = [[0 for _ in range(capacity + 1)] for _ in range(n + 1)]
    for i in range(1, n + 1):
        for w in range(1, capacity + 1):
            if w < i:
                dp[i][w] = dp[i - 1][w]
            else:
                dp[i][w] = max(dp[i - 1][w], profits[i - 1] + dp[i - 1][w - i])
    result = []
    w = capacity
    for i in range(n, 0, -1):
        if dp[i][w] != dp[i - 1][w]:
            result.append(items[i - 1])
            w -= i
    return result

def genetic_algorithm(population_size, generations, dna_length, fitness_function):
    population = [''.join(random.choice('01') for _ in range(dna_length)) for _ in range(population_size)]
    for _ in range(generations):
        fitnesses = [fitness_function(dna) for dna in population]
        fittest_indices = sorted(range(population_size), key=lambda i: fitnesses[i], reverse=True)[:population_size//2]
        selected_dnas = [population[i] for i in fittest_indices]
        offspring = []
        while len(offspring) < population_size:
            parent1, parent2 = random.sample(selected_dnas, 2)
            crossover_point = random.randint(1, dna_length-1)
            child1 = parent1[:crossover_point] + parent2[crossover_point:]
            child2 = parent2[:crossover_point] + parent1[crossover_point:]
            offspring.extend([child1, child2])
        for i in range(population_size):
            if random.random() < 0.1:  # 10% mutation rate
                mutation_point = random.randint(0, dna_length-1)
                offspring[i] = offspring[i][:mutation_point] + str(1-int(offspring[i][mutation_point])) + offspring[i][mutation_point+1:]
        population = offspring
    return max(population, key=fitness_function)

def cluster_points(points: List[Tuple[int, int]], threshold: int) -> List[List[Tuple[int, int]]]:
    clustering = DBSCAN(eps=threshold, min_samples=2).fit(points)
    labels = clustering.labels_
    clusters = [[] for _ in range(max(labels) + 1)]
    for i, label in enumerate(labels):
        clusters[label].append(points[i])
    return clusters

def porter_stemmer(sentences: List[str]) -> List[str]:
    if not sentences:
        return []
    
    stemmed_words = []
    for sentence in sentences:
        words = sentence.split()
        for word in words:
            # Remove prefixes
            if word.endswith('ing'):
                word = word[:-3]
            elif word.endswith('ed'):
                word = word[:-2]
            
            # Remove suffixes
            if word.endswith('ly'):
                word = word[:-2]
            
            stemmed_words.append(word.lower())
    
    return stemmed_words
```

File: moving_averages.py:

```Python
from typing import List
import random
from collections import Counter
from typing import List, Dict
import math
import heapq
from typing import List, Tuple

def moving_averages(sequence: List[int], window_size: int) -> List[float]:
    if window_size > len(sequence) or window_size <= 0:
        return []
    
    averages = []
    
    for i in range(len(sequence) - window_size + 1):
        window_sum = sum(sequence[i:i + window_size])
        average = window_sum / window_size
        averages.append(average)
        
    return averages

def pair_generator(num_pairs: int, max_num: int) -> List[List[int]]:
    if num_pairs > max_num * (max_num - 1) // 2:
        raise ValueError("num_pairs cannot be greater than the total possible pairs")
    
    pairs = set()
    while len(pairs) < num_pairs:
        pair = tuple(sorted((random.randint(1, max_num), random.randint(1, max_num))))
        if pair[0] != pair[1]:  # ensure the pair does not contain duplicate numbers
            pairs.add(pair)
    
    return [list(pair) for pair in pairs]

def can_sum_to_target(arr, target):
    sums = {0}
    
    for num in arr:
        new_sums = set()
        for s in sums:
            new_sum = s + num
            if new_sum == target:
                return True
            new_sums.add(new_sum)
        sums.update(new_sums)

    return False

def similar_vertices(graph: List[List[int]], start_vertex: int, k: int) -> List[int]:
    n = len(graph)
    similarity_scores = [0] * n
    similarity_scores[start_vertex] = float('inf')  # Start vertex is not similar to itself
    
    for vertex in range(n):
        if vertex != start_vertex:
            similarity_scores[vertex] = sum(graph[start_vertex][v] & graph[vertex][v] for v in range(n))
    
    top_k_vertices = sorted(range(n), key=lambda x: similarity_scores[x], reverse=True)[:k]
    
    return top_k_vertices

def product_subarrays(nums: List[int], k: int) -> List[List[int]]:
    threshold = sum(nums[k:])
    result = []
    for i in range(len(nums) - k + 1):
        subarray = nums[i:i + k]
        if len(set(subarray)) == k and subarray[0] != 0 and subarray[-1] != 0:
            subarray_product = 1
            for num in subarray:
                subarray_product *= num
            if subarray_product > threshold:
                result.append(subarray)
    return result

def best_clique(adj_matrix: List[List[int]], k: int) -> List[int]:
    if k > len(adj_matrix):
        return []
    
    best_clique_nodes = []
    max_density = 0
    
    for i in range(len(adj_matrix)):
        clique_nodes = [i]
        visited = [False] * len(adj_matrix)
        visited[i] = True
        
        while len(clique_nodes) < k:
            max_neighbors = -1
            next_node = None
            for j in range(len(adj_matrix)):
                if not visited[j] and sum(adj_matrix[j][n] for n in clique_nodes) > max_neighbors:
                    max_neighbors = sum(adj_matrix[j][n] for n in clique_nodes)
                    next_node = j
            if next_node is None:
                break
            clique_nodes.append(next_node)
            visited[next_node] = True
        
        if len(clique_nodes) == k:
            density = sum(adj_matrix[i][j] for i in clique_nodes for j in clique_nodes if i < j) / (k * (k - 1) / 2)
            if density > max_density:
                max_density = density
                best_clique_nodes = clique_nodes
    
    return best_clique_nodes

def can_construct_word(words, word):
    char_count = Counter()
    for w in words:
        char_count.update(w)  # Count occurrences of each character

    word_count = Counter(word)
    
    for char, count in word_count.items():
        if char_count[char] < count:  # Check availability against requested count
            return False
            
    return True

def total_tree_volume(trees: List[Dict[str, int]], max_height: int) -> float:
    total_volume = 0
    for tree in trees:
        if tree['height'] <= max_height:
            radius = tree['width'] / 2
            volume = math.pi * radius ** 2 * tree['height']
            total_volume += volume
    
    return total_volume

def are_parentheses_balanced(sequence: str) -> bool:
    stack = []
    mapping = {')': '(', '}': '{', ']': '['}
    
    for char in sequence:
        if char in mapping.values():
            stack.append(char)
        elif char in mapping.keys():
            if stack == [] or mapping[char] != stack.pop():
                return False
    
    return stack == []

def needleman_wunsch(sequences, gap_penalty):
    # Initialize scoring matrix
    scoring_matrix = [[0 for _ in range(len(sequences[1])+1)] for _ in range(len(sequences[0])+1)]
    
    # Initialize traceback matrix
    traceback_matrix = [[None for _ in range(len(sequences[1])+1)] for _ in range(len(sequences[0])+1)]
    
    # Initialize first row and column of scoring matrix
    for i in range(len(sequences[0])+1):
        scoring_matrix[i][0] = gap_penalty * i
    for j in range(len(sequences[1])+1):
        scoring_matrix[0][j] = gap_penalty * j
    
    # Fill in scoring matrix
    for i in range(1, len(sequences[0])+1):
        for j in range(1, len(sequences[1])+1):
            match = scoring_matrix[i-1][j-1] + (0 if sequences[0][i-1] == sequences[1][j-1] else -1)
            delete = scoring_matrix[i-1][j] + gap_penalty
            insert = scoring_matrix[i][j-1] + gap_penalty
            scoring_matrix[i][j] = max(match, delete, insert)
            if scoring_matrix[i][j] == match:
                traceback_matrix[i][j] = "match"
            elif scoring_matrix[i][j] == delete:
                traceback_matrix[i][j] = "delete"
            else:
                traceback_matrix[i][j] = "insert"
    
    # Trace back optimal alignment
    alignment = []
    i, j = len(sequences[0]), len(sequences[1])
    while i > 0 or j > 0:
        if traceback_matrix[i][j] == "match":
            alignment.append((sequences[0][i-1], sequences[1][j-1]))
            i -= 1
            j -= 1
        elif traceback_matrix[i][j] == "delete":
            alignment.append((sequences[0][i-1], "-"))
            i -= 1
        else:
            alignment.append(("-", sequences[1][j-1]))
            j -= 1
    
    return alignment[::-1]

def dijkstra_shortest_path(n: int, edges: List[Tuple[int, int, int]], start: int, end: int) -> Tuple[int, List[int]]:
    graph = {i: [] for i in range(n)}
    for u, v, w in edges:
        graph[u].append((v, w))
    
    min_heap = [(0, start)]
    visited = set()
    distances = {i: float('inf') for i in range(n)}
    distances[start] = 0
    parent = {start: None}
    
    while min_heap:
        current_distance, current_node = heapq.heappop(min_heap)
        if current_node in visited:
            continue
        visited.add(current_node)

        for neighbor, weight in graph[current_node]:
            distance = current_distance + weight
            if distance < distances[neighbor]:
                distances[neighbor] = distance
                parent[neighbor] = current_node
                heapq.heappush(min_heap, (distance, neighbor))

    if distances[end] == float('inf'):
        return -1, []

    path = []
    while end is not None:
        path.append(end)
        end = parent[end]
    
    return distances[path[0]], path[::-1]
```

File: event_overlap.py:

```Python
from typing import List, Tuple
from collections import Counter
from typing import List
import heapq
import re
from collections import defaultdict
from typing import Dict, List, Tuple

def filtered_word_count(words: List[str], min_length: int) -> List[Tuple[str, int]]:
    filtered_words = [word.lower() for word in words if len(word) >= min_length]
    word_counts = Counter(filtered_words)
    return sorted(word_counts.items(), key=lambda item: item[1], reverse=True)

def first_pair_sum(nums: List[int], target: int) -> int:
    num_set = set()
    for num in nums:
        if target - num in num_set:
            return 1
        num_set.add(num)
    return -1

def most_frequent_words(text: str, num_words: int) -> List[str]:
    words = re.findall(r'\b[a-zA-Z]{3,}\b', text.lower())
    word_freq = Counter(words)
    return heapq.nlargest(num_words, word_freq, key=word_freq.get)

def closest_pair_equal_elements(nums: List[int]) -> int:
    if len(nums) < 2:
        raise ValueError("List has less than two elements")
    
    nums.sort()
    min_diff = float('inf')
    
    for i in range(1, len(nums)):
        if nums[i] == nums[i - 1]:
            min_diff = min(min_diff, i - (i - 1))
    
    if min_diff == float('inf'):
        raise ValueError("No pairs of equal elements")
    
    return min_diff

def image_grayscaler(image, threshold):
    grayscale_image = []
    
    for row in image:
        grayscale_row = []
        
        for pixel in row:
            intensity = sum(pixel) // 3
            grayscale_pixel = [0, 0, 0] if intensity < threshold else [255, 255, 255]
            grayscale_row.append(grayscale_pixel)
        
        grayscale_image.append(grayscale_row)
    
    return grayscale_image

def find_busiest_airport(routes: List[Tuple[str, str]]) -> Tuple[str, List[str]]:
    graph = defaultdict(list)
    for departure, arrival in routes:
        graph[departure].append(arrival)
        graph[arrival].append(departure)
    
    busiest_airport = max(graph, key=lambda x: len(graph[x]))
    return busiest_airport, graph[busiest_airport]

def maximum_overlap(events: List[Tuple[int, int]]) -> int:
    points = []
    for start, end in events:
        points.append((start, 1))
        points.append((end, -1))
    
    points.sort()
    max_overlap = 0
    current_overlap = 0
    
    for _, delta in points:
        current_overlap += delta
        max_overlap = max(max_overlap, current_overlap)
    
    return max_overlap

def calculate_student_average_grades(student_grades: Dict[str, List[int]], threshold: int) -> Dict[str, Tuple[float, bool]]:
    result = {}
    
    for student, grades in student_grades.items():
        numeric_grades = [grade for grade in grades if isinstance(grade, (int, float))]
        if numeric_grades:
            average_grade = sum(numeric_grades) / len(numeric_grades)
            result[student] = (average_grade, average_grade >= threshold)
    
    return result

def join_strings_with_delimiter(lst: List[str], delimiter: str) -> str:
    return delimiter.join(lst)

def regex_matcher(pattern: str, strings: List[str]) -> List[bool]:
    compiled_pattern = re.compile(pattern)
    
    return [bool(compiled_pattern.fullmatch(string)) for string in strings]

def min_coins_for_change(coins: List[int], amount: int, max_coins: int) -> int:
    dp = [float('inf')] * (amount + 1)
    dp[0] = 0
    
    for coin in coins:
        for i in range(coin, amount + 1):
            dp[i] = min(dp[i], dp[i - coin] + 1)
            
    if dp[amount] > max_coins:
        return -1
    
    return dp[amount]
```

File: database_queries.py:

```Python
from typing import List
import numpy as np
from typing import List, Tuple
import heapq

def topological_sorter(graph: List[List[int]], start_vertex: int) -> List[int]:
    in_degree = [0] * len(graph)
    for i in range(len(graph)):
        for j in range(len(graph[i])):
            if graph[i][j] == 1:
                in_degree[j] += 1
    
    ordering = []
    queue = []
    for i in range(len(in_degree)):
        if in_degree[i] == 0:
            queue.append(i)
    
    while queue:
        vertex = queue.pop(0)
        ordering.append(vertex)
        for i in range(len(graph[vertex])):
            if graph[vertex][i] == 1:
                in_degree[i] -= 1
                if in_degree[i] == 0:
                    queue.append(i)
    
    if len(ordering) != len(graph):
        raise Exception("Cyclic dependency detected")
    
    return ordering

def svd_reconstruction(matrix, k):
    # Perform SVD on the matrix
    U, s, Vh = np.linalg.svd(matrix, full_matrices=False)
    
    # Retain only the top-k singular values and singular vectors
    Uk = U[:, :k]
    sk = s[:k]
    Vkh = Vh[:k, :]
    
    # Reconstruct the matrix from the retained singular values and singular vectors
    reconstructed_matrix = Uk @ np.diag(sk) @ Vkh
    
    return reconstructed_matrix

def transitive_closure(relations: List[List[str]], query: List[str]) -> List[List[int]]:
    num_entities = len(query)
    closure = [[0] * num_entities for _ in range(num_entities)]
    
    for i in range(num_entities):
        for j in range(num_entities):
            for relation in relations:
                if relation[0] == query[i] and relation[1] == query[j]:
                    closure[i][j] = 1
                    break
    
    for k in range(num_entities):
        for i in range(num_entities):
            for j in range(num_entities):
                if closure[i][k] and closure[k][j]:
                    closure[i][j] = 1
    
    return closure

def find_contiguous_subarrays(matrix: List[List[int]], target: int) -> List[Tuple[int, List[Tuple[int, int]]]]:
    result = []
    
    for i, row in enumerate(matrix):
        current_sum = 0
        start = 0
        subarrays = []
        
        for end in range(len(row)):
            current_sum += row[end]
            
            while current_sum > target and start <= end:
                current_sum -= row[start]
                start += 1
            
            if current_sum == target:
                subarrays.append((start, end))
        
        if subarrays:
            result.append((i, subarrays))
    
    return result

def sequence_variations(sequences: List[str], variations: int) -> List[str]:
    complements = {'A': 'T', 'T': 'A', 'G': 'C', 'C': 'G'}
    unique_variations = set(sequences)
    
    for _ in range(variations):
        new_variations = set()
        for sequence in unique_variations:
            for i in range(len(sequence)):
                for base, complement in complements.items():
                    new_sequence = sequence[:i] + complement + sequence[i+1:]
                    new_variations.add(new_sequence)
        unique_variations.update(new_variations)
        
    return list(unique_variations)

def largest_submatrix(matrix: List[List[int]], target: int) -> int:
    rows, cols = len(matrix), len(matrix[0])
    prefix_sum = [[0] * (cols + 1) for _ in range(rows + 1)]
    
    for i in range(1, rows + 1):
        for j in range(1, cols + 1):
            prefix_sum[i][j] = matrix[i - 1][j - 1] + prefix_sum[i - 1][j] + prefix_sum[i][j - 1] - prefix_sum[i - 1][j - 1]
    
    max_size = 0
    for i in range(rows):
        for j in range(cols):
            for k in range(i + 1, rows + 1):
                for end_col in range(j + 1, cols + 1):
                    submatrix_sum = prefix_sum[k][end_col] - prefix_sum[k][j] - prefix_sum[i][end_col] + prefix_sum[i][j]
                    if submatrix_sum <= target:
                        max_size = max(max_size, (k - i) * (end_col - j))
    
    return max_size

def moving_average_filter(series, window_size):
    filtered_series = []
    
    for i in range(len(series) - window_size + 1):
        window = series[i:i + window_size]
        avg = sum(window) / window_size
        filtered_series.append(avg)
    
    return filtered_series

def max_submatrix_sum_finder(matrix: List[List[int]], target_sum: int) -> Tuple[Tuple[int, int], Tuple[int, int]]:
    rows, cols = len(matrix), len(matrix[0])
    prefix_sum = [[0] * (cols + 1) for _ in range(rows + 1)]
    
    for i in range(1, rows + 1):
        for j in range(1, cols + 1):
            prefix_sum[i][j] = prefix_sum[i-1][j] + prefix_sum[i][j-1] - prefix_sum[i-1][j-1] + matrix[i-1][j-1]
    
    max_sum = float('-inf')
    top_left, bottom_right = None, None
    
    for i in range(1, rows + 1):
        for j in range(1, cols + 1):
            for k in range(i, rows + 1):
                for end_col in range(j, cols + 1):
                    submatrix_sum = prefix_sum[k][end_col] - prefix_sum[k][j-1] - prefix_sum[i-1][end_col] + prefix_sum[i-1][j-1]
                    if submatrix_sum <= target_sum and submatrix_sum > max_sum:
                        max_sum = submatrix_sum
                        top_left, bottom_right = (i-1, j-1), (k-1, end_col-1)
    
    return top_left, bottom_right

def calculate_total_sent(transactions: List[Tuple[str, str, int]], sender: str) -> int:
    total_sent = 0
    for transaction in transactions:
        if transaction[0] == sender:
            total_sent += transaction[2]
    return total_sent

def furthest_building(heights: List[int], bricks: List[int], ladders: int) -> int:
    heap = []
    total_bricks_used = 0
    
    for i in range(len(heights) - 1):
        brick_height = heights[i + 1] - heights[i]
        if brick_height > 0:
            heapq.heappush(heap, brick_height)
            total_bricks_used += brick_height
            
            if len(heap) > ladders:
                total_bricks_used -= heapq.heappop(heap)
                if total_bricks_used > bricks:
                    return i
                
    return len(heights) - 1

def is_valid_parentheses(s: str) -> bool:
    stack = []
    for char in s:
        if char == '(':
            stack.append(char)
        elif char == ')':
            if not stack:
                return False
            stack.pop()
        elif char not in ['(', ')']:
            return False
    
    return not stack
```

--------------------------------------------------------------------------------------------------

Problem Statement: Parameters:
- matrix: List[List[int]] # A 2D list of integers representing the input matrix to search for the target.
- target: int # The target integer to search for in the matrix.
- graph: List[List[int]] # A list of edges representing the graph for finding the median connected component.
- vertices: int # The number of vertices in the graph.
- binary_string: str # A binary string that will be decoded using variable-length codes.
- codes: Dict[str, str] # A dictionary of variable-length codes and their corresponding characters.
- bitstrings: List[str] # A list of bitstrings to calculate the minimum number of flips required to transform into the target bitstring.
- target_bitstring: str # The target bitstring for comparison to the list of bitstrings.

Objectives:
- Implement a search algorithm that utilizes the parameters matrix and target to find the position of the target. Capture the row and column indices as the output position.
- Based on the output position from the search algorithm, if the target is found, invoke another function using graph and vertices to compute the median connected component from the graph. Capture the median subgraphs formed as output.
- Decode the binary_string using the codes parameter to obtain a meaningful string. Handle possible decoding errors and ensure to return "Invalid code" in such cases.
- Calculate the minimum number of bit flips needed to transform each string in bitstrings to the target_bitstring using Hamming distance. Store the minimum flips and the corresponding bitstring.
- Aggregating the results from the previous goals, determine if the decoded string is present in the bitstring that requires the least number of flips. Track whether it exists and output this as a boolean result.
- Compile all obtained results into a structured format including the position, the median subgraphs, the decoded string, the minimum flips, and the existence of the decoded string in the transformed bitstring.

Return Values:
- position: Tuple[int, int] # The position (row index, column index) of the target in the matrix or (-1, -1) if not found.
- median_subgraphs: List[List[List[int]]] # The median subgraphs resulting from the median connected component.
- decoded_string: str # The meaningful string obtained from decoding the binary string.
- min_flips: int # The minimum number of bit flips required to transform the chosen bitstring to the target.
- min_bitstring: str # The bitstring that requires the minimum flips.
- exists: bool # A boolean indicating whether the decoded string exists in the bitstring that received the minimum flips.

The name of the function you create should be complex_algorithm

--------------------------------------------------------------------------------------------------

Answer Code:
def complex_algorithm(matrix: List[List[int]], target: int, graph: List[List[int]], vertices: int,
                      binary_string: str, codes: Dict[str, str], bitstrings: List[str], target_bitstring: str) -> Tuple[Tuple[int, int], List[List[List[int]]], str, int, str, bool]:
    # Step 1: Search for the target in the matrix
    position = search_matrix(matrix, target)
    
    median_subgraphs = []
    decoded_string = ""
    min_flips = 0
    min_bitstring = ""
    exists = False
    # Step 2: If the target is found, compute the median component
    if position != (-1, -1):
        median_subgraphs = median_component(graph, vertices)
    # Step 3: Decode the binary string using the provided variable-length codes
    try:
        decoded_string = decode_variable_length_codes(binary_string, codes)
    except ValueError:
        decoded_string = "Invalid code"
    # Step 4: Calculate the minimum bit flips
    min_flips, min_bitstring = min_bit_flips(bitstrings, target_bitstring)
    # Step 5: Check if the decoded string is in the selected bitstring
    exists = decoded_string in min_bitstring
    # Return the results as a structured tuple
    return position, median_subgraphs, decoded_string, min_flips, min_bitstring, exists

--------------------------------------------------------------------------------------------------

Test Code:
# Import statements if required
from typing import List, Tuple, Dict

# Import function from file
from complex_processing import complex_algorithm

# Initialize input parameters
matrix = [[1, 2, 3], [4, 5, 6], [7, 8, 9]]
target = 5
graph = [[0, 1], [1, 2], [2, 0], [1, 3]]  # Edges in the graph
vertices = 4
binary_string = "101110"
codes = {"10": "A", "111": "B", "00": "C"}
bitstrings = ["001", "111", "101"]
target_bitstring = "110"

# Call function with input parameters
return_position, return_median_subgraphs, return_decoded_string, return_min_flips, return_min_bitstring, return_exists = complex_algorithm(matrix, target, graph, vertices, binary_string, codes, bitstrings, target_bitstring)

# Step-by-step run-through of function to obtain intermediate outputs:

# Step 1
# Explanation: Search for the target in the matrix
position = (-1, -1)
if matrix and matrix[0]:
    rows, cols = len(matrix), len(matrix[0])
    row, col = 0, cols - 1
    while row < rows and col >= 0:
        current = matrix[row][col]
        if current == target:
            position = (row, col)
            break
        elif current > target:
            col -= 1  # Move left
        else:
            row += 1  # Move down

# Step 2
# Explanation: If the target is found, compute the median component
median_subgraphs = []
if position != (-1, -1):
    total_distance = 0
    distance_matrix = [[float('inf')] * vertices for _ in range(vertices)]
    
    for i in range(vertices):
        distance_matrix[i][i] = 0
    
    for u, v in graph:
        distance_matrix[u][v] = distance_matrix[v][u] = 1

    for k in range(vertices):
        for i in range(vertices):
            for j in range(vertices):
                distance_matrix[i][j] = min(distance_matrix[i][j], distance_matrix[i][k] + distance_matrix[k][j])
                if distance_matrix[i][j] != float('inf'):
                    total_distance += distance_matrix[i][j]
    
    median_distance = total_distance // (vertices * (vertices - 1) // 2)
    
    visited = [False] * vertices
    median_component = []
    subgraph1 = []
    subgraph2 = []
    
    for start in range(vertices):
        if not visited[start]:
            queue = [start]
            visited[start] = True
            subgraph = [start]
            
            while queue:
                node = queue.pop(0)
                for neighbor, edge_length in enumerate(distance_matrix[node]):
                    if edge_length == median_distance and not visited[neighbor]:
                        queue.append(neighbor)
                        visited[neighbor] = True
                        subgraph.append(neighbor)
            
            median_component.append(subgraph)
            if len(subgraph) > len(median_component[0]):
                subgraph1 = median_component[0]
                median_component[0] = subgraph
            else:
                subgraph2 = subgraph

# Step 3
# Explanation: Decode the binary string using the provided variable-length codes
decoded_string = ""
temp = ""
for bit in binary_string:
    temp += bit
    if temp in codes:
        decoded_string += codes[temp]
        temp = ""

if temp:  # If the binary string is not a valid code
    decoded_string = "Invalid code"

# Step 4
# Explanation: Calculate the minimum bit flips
min_flips = float('inf')
min_bitstring = ''

for bitstring in bitstrings:
    flips = sum(el1 != el2 for el1, el2 in zip(bitstring, target_bitstring))
    if flips < min_flips:
        min_flips = flips
        min_bitstring = bitstring

# Step 5
# Explanation: Check if the decoded string is in the selected bitstring
exists = decoded_string in min_bitstring

# Final Expected Output:
correct_position = position
correct_median_subgraphs = [subgraph1, subgraph2]
correct_decoded_string = decoded_string
correct_min_flips = min_flips
correct_min_bitstring = min_bitstring
correct_exists = exists

# Assert statements (compulsory) to check if the function returns the correct values:
assert return_position == correct_position
assert return_median_subgraphs == correct_median_subgraphs
assert return_decoded_string == correct_decoded_string
assert return_min_flips == correct_min_flips
assert return_min_bitstring == correct_min_bitstring
assert return_exists == correct_exists

print('All-Pass')

--------------------------------------------------------------------------------------------------

