Question No: 4
Context Size: 16558

Codebase:

File: substring_frequencies.py:

```Python
from collections import Counter
from typing import List, Tuple
from typing import Dict
from collections import defaultdict
from typing import List
from typing import List, Optional

def analyze_integer_frequencies(n, elements):
    frequency = Counter(elements)
    duplicates = sorted([x for x, count in frequency.items() if count > 1])
    unique_frequencies = {x: frequency[x] for x in duplicates}
    return unique_frequencies

def find_overlapping_rectangles(rectangles: List[Tuple[int, int, int, int]]) -> List[Tuple[Tuple[int, int, int, int], Tuple[int, int, int, int]]]:
    events = []
    
    for x, y, w, h in rectangles:
        events.append((x, 1, (x, y, w, h)))
        events.append((x + w, -1, (x, y, w, h)))
    
    events.sort()
    
    active_rectangles = []
    overlapping_pairs = []
    
    for x, delta, rectangle in events:
        if delta == 1:
            active_rectangles.append(rectangle)
        else:
            active_rectangles.remove(rectangle)
        
        for other in active_rectangles:
            if (rectangle[0] < other[0] + other[2] and
                rectangle[0] + rectangle[2] > other[0] and
                rectangle[1] < other[1] + other[3] and
                rectangle[1] + rectangle[3] > other[1]):
                overlapping_pairs.append((rectangle, other))
    
    return overlapping_pairs

def common_substrings(sequence: str, k: int, threshold: float) -> Dict[str, int]:
    frequencies = defaultdict(int)
    
    for i in range(len(sequence) - k + 1):
        substring = sequence[i:i+k]
        frequencies[substring] += 1
    
    common_substrings = {substring: frequency for substring, frequency in frequencies.items() if frequency / len(sequence) >= threshold}
    
    return common_substrings

def prefix_tree(text: str) -> Dict[str, Dict[str, str]]:
    prefix_tree_dict = {}
    
    words = text.split()
    
    for word in words:
        node = prefix_tree_dict
        
        for char in word:
            if char not in node:
                node[char] = {}
            node = node[char]
        
        node['$'] = word
    
    return prefix_tree_dict

def filter_unique_words(words: List[str], length: int) -> List[str]:
    seen = set()
    unique_words = []
    
    for word in words:
        if len(word) == length and word not in seen:
            unique_words.append(word)
            seen.add(word)
    
    return unique_words

def word_segmentation(text: str, dictionary: List[str]) -> str:
    n = len(text)
    dp = [False] * (n + 1)
    dp[0] = True
    
    for i in range(1, n + 1):
        for j in range(i):
            if dp[j] and text[j:i] in dictionary:
                dp[i] = True
                break
    
    i = n
    result = []
    
    while i > 0:
        for j in range(i):
            if dp[j] and text[j:i] in dictionary:
                result.append(text[j:i])
                i = j
                break
    
    return ' '.join(result[::-1])

def calculate_prefix_sums(data: List[int], threshold: int) -> List[int]:
    prefix_sums = []
    current_sum = 0
    
    for num in data:
        current_sum += num
        prefix_sums.append(current_sum)
    
    return [sum for sum in prefix_sums if sum > threshold]

def shortest_terrain_path(matrix: List[List[int]], start_position: Tuple[int, int], end_position: Tuple[int, int]) -> List[Tuple[int, int]]:
    rows, cols = len(matrix), len(matrix[0])
    directions = [(0, 1), (0, -1), (1, 0), (-1, 0)]
    queue = [(start_position, [start_position], 0)]
    visited = set()
    
    while queue:
        (x, y), path, elevation_change = queue.pop(0)
        visited.add((x, y))
        
        if (x, y) == end_position:
            return path
        
        for dx, dy in directions:
            nx, ny = x + dx, y + dy
            
            if 0 <= nx < rows and 0 <= ny < cols and (nx, ny) not in visited:
                new_elevation_change = elevation_change + abs(matrix[nx][ny] - matrix[x][y])
                queue.append(((nx, ny), path + [(nx, ny)], new_elevation_change))
    
    return []

def submatrix_sums(matrix: List[List[int]], k: int) -> List[Tuple[Tuple[int, int], int]]:
    rows, cols = len(matrix), len(matrix[0])
    sums = []
    
    for i in range(rows - k + 1):
        for j in range(cols - k + 1):
            submatrix_sum = sum(matrix[x][y] for x in range(i, i + k) for y in range(j, j + k))
            sums.append(((i, j), submatrix_sum))
    
    return sums

def knapsack_solver(items: List[str], capacity: int, profits: List[int]) -> List[str]:
    n = len(profits)
    dp = [[0 for _ in range(capacity + 1)] for _ in range(n + 1)]
    for i in range(1, n + 1):
        for w in range(1, capacity + 1):
            if w < i:
                dp[i][w] = dp[i - 1][w]
            else:
                dp[i][w] = max(dp[i - 1][w], profits[i - 1] + dp[i - 1][w - i])
    result = []
    w = capacity
    for i in range(n, 0, -1):
        if dp[i][w] != dp[i - 1][w]:
            result.append(items[i - 1])
            w -= i
    return result

def calculate_median(numbers: List[int], threshold: int) -> Optional[int]:
    if not numbers:
        return None
    
    sorted_numbers = sorted(numbers)
    n = len(sorted_numbers)
    
    if n % 2 == 0:
        median = (sorted_numbers[n // 2 - 1] + sorted_numbers[n // 2]) / 2
    else:
        median = sorted_numbers[n // 2]
    
    return median if median >= threshold else None
```

File: triplet_sum_finder.py:

```Python
from typing import List
import itertools
from typing import List, Tuple
from typing import Dict, List, Tuple
from typing import List, Optional
from typing import Dict, List

def shortest_concatenated_string(strings: List[str], max_length: int, target_string: str) -> str:
    concatenated_string = ""
    
    for string in strings:
        if target_string in string and len(concatenated_string) + len(string) <= max_length:
            concatenated_string += string
            break
        elif len(concatenated_string) + len(string) <= max_length:
            concatenated_string += string
    
    return concatenated_string

def combinations_above_average(arr: List[int], size: int) -> List[List[int]]:
    combs = list(itertools.combinations(arr, size))
    average = sum(sum(comb) for comb in combs) / len(combs) if combs else 0
    return [list(comb) for comb in combs if sum(comb) > average]

def scheduler(tasks: List[Tuple[int, int]], k: int) -> int:
    tasks.sort(key=lambda x: x[1])
    computers = [0] * k
    
    for duration, _ in tasks:
        min_computer = computers.index(min(computers))
        computers[min_computer] += duration
        
    return max(computers)

def calculate_student_average_grades(student_grades: Dict[str, List[int]], threshold: int) -> Dict[str, Tuple[float, bool]]:
    result = {}
    
    for student, grades in student_grades.items():
        numeric_grades = [grade for grade in grades if isinstance(grade, (int, float))]
        if numeric_grades:
            average_grade = sum(numeric_grades) / len(numeric_grades)
            result[student] = (average_grade, average_grade >= threshold)
    
    return result

def find_kth_largest(numbers: List[int], k: int) -> Optional[int]:
    unique_numbers = list(set(numbers))
    
    if k > len(unique_numbers):
        return None
    
    unique_numbers.sort(reverse=True)
    return unique_numbers[k - 1]  # k-th largest is at k-1 index

def binomial_coefficient_calculator(n: int, m: int, k: int) -> List[List[int]]:
    coefficients = [[0] * (k + 1) for _ in range(m + 1)]
    
    for i in range(m + 1):
        coefficients[i][0] = 1
        coefficients[i][min(i, k)] = 1
    
    for i in range(1, m + 1):
        for j in range(1, min(i, k) + 1):
            coefficients[i][j] = coefficients[i - 1][j - 1] + coefficients[i - 1][j]
    
    return coefficients

def independent_cascade(network, seed_nodes, influence_probability):
    active_nodes = set(seed_nodes)
    time_steps = [len(active_nodes)]
    
    while True:
        new_active_nodes = set()
        for node in active_nodes:
            for neighbor in network[node]:
                if neighbor not in active_nodes and np.random.rand() < influence_probability:
                    new_active_nodes.add(neighbor)
        active_nodes.update(new_active_nodes)
        time_steps.append(len(active_nodes))
        
        if not new_active_nodes:
            break
    
    return time_steps

def gins_subgraph(network: Dict[str, List[str]], nodes: List[str]) -> Dict[str, List[str]]:
    subgraph = {node: [] for node in nodes}
    for node in nodes:
        for neighbor in network[node]:
            if neighbor in nodes:
                subgraph[node].append(neighbor)
    
    return subgraph

def modular_product(numbers: List[int], modulus: int) -> int:
    if not numbers:
        return 1
    
    product = 1
    for number in numbers:
        product = (product * number) % modulus
        
    return product

def closest_triplet_sum(n: int, arr: List[int], x: int) -> List[int]:
    arr.sort()
    closest_sum = float('inf')
    result = []

    for i in range(n - 2):
        left, right = i + 1, n - 1 

        while left < right:
            current_sum = arr[i] + arr[left] + arr[right]

            if abs(current_sum - x) < abs(closest_sum - x):
                closest_sum = current_sum
                result = [arr[i], arr[left], arr[right]]

            if current_sum < x:
                left += 1
            elif current_sum > x:
                right -= 1
            else:
                return [arr[i], arr[left], arr[right]]

    return result

def optimal_schedule(schedule: List[List[int]], available: List[int]) -> List[List[int]]:
    schedule.sort(key=lambda x: x[1])
    optimal = []
    last_end = -1
    
    for task in schedule:
        if task[0] >= last_end and task[1] <= available[0]:
            optimal.append(task)
            last_end = task[1]
            available[0] -= task[1] - task[0]
    
    return optimal
```

File: statistical_analyzer.py:

```Python
from typing import List
import numpy as np
from typing import Dict, List
from typing import List, Dict, Set
from typing import List, Tuple
from typing import List, Optional
import random
from typing import List, Dict
import statistics
import math
from sklearn.cluster import DBSCAN

def image_convolution(data: List[List[int]], kernel_size: int) -> List[List[int]]:
    # Normalize the input image
    normalized_data = np.array(data) / max(max(row) for row in data) * 255
    
    # Define the kernel
    kernel = np.ones((kernel_size, kernel_size)) / kernel_size ** 2
    
    # Perform convolution operation
    convolved_data = np.zeros(normalized_data.shape)
    for i in range(normalized_data.shape[0] - kernel_size + 1):
        for j in range(normalized_data.shape[1] - kernel_size + 1):
            convolved_data[i, j] = np.sum(normalized_data[i:i+kernel_size, j:j+kernel_size] * kernel)
    
    # Apply max pooling operation
    pooled_data = np.zeros((convolved_data.shape[0] // 2, convolved_data.shape[1] // 2))
    for i in range(pooled_data.shape[0]):
        for j in range(pooled_data.shape[1]):
            pooled_data[i, j] = np.max(convolved_data[i*2:i*2+2, j*2:j*2+2])
    
    return pooled_data.tolist()

def max_island_area(grid: List[List[int]], row: int, col: int) -> int:
    if not grid or row < 0 or row >= len(grid) or col < 0 or col >= len(grid[0]) or grid[row][col] == 0:
        return 0
    
    grid[row][col] = 0
    area = 1
    
    area += max_island_area(grid, row - 1, col)
    area += max_island_area(grid, row + 1, col)
    area += max_island_area(grid, row, col - 1)
    area += max_island_area(grid, row, col + 1)
    
    return area

def dfs_search(graph: Dict[str, List[str]], start_node: str, end_node: str) -> List[str]:
    visited = set()
    stack = [(start_node, [start_node])]
    
    while stack:
        node, path = stack.pop()
        if node == end_node:
            return path
        if node not in visited:
            visited.add(node)
            for neighbor in graph[node]:
                stack.append((neighbor, path + [neighbor]))
    
    return []

def travelling_salesman(routes: List[List[int]], distances: List[List[int]]) -> List[int]:
    if not routes or not distances:
        return []
    
    num_cities = len(distances)
    visited = [False] * num_cities
    current_city = 0
    route = [current_city]
    visited[current_city] = True
    
    for _ in range(num_cities - 1):
        min_distance = float('inf')
        next_city = None
        for i in range(num_cities):
            if not visited[i] and distances[current_city][i] < min_distance:
                min_distance = distances[current_city][i]
                next_city = i
        route.append(next_city)
        visited[next_city] = True
        current_city = next_city
    
    route.append(route[0])
    return route

def dfs_traversal(matrix: List[List[int]], row: int, col: int) -> Dict[str, object]:
    visited = set()
    parent = {}
    stack = [(row, col, None)]
    
    while stack:
        current_row, current_col, parent_node = stack.pop()
        
        if (current_row, current_col) not in visited:
            visited.add((current_row, current_col))
            parent[(current_row, current_col)] = parent_node
            
            for neighbor_row, neighbor_col in [(current_row - 1, current_col), (current_row + 1, current_col), (current_row, current_col - 1), (current_row, current_col + 1)]:
                if 0 <= neighbor_row < len(matrix) and 0 <= neighbor_col < len(matrix[0]):
                    stack.append((neighbor_row, neighbor_col, (current_row, current_col)))
    
    return {"visited": visited, "parent": parent}

def find_pattern(strings: List[str], pattern: str) -> List[Tuple[int, int]]:
    result = []
    for i, string in enumerate(strings):
        dp = [[False] * (len(pattern) + 1) for _ in range(len(string) + 1)]
        dp[0][0] = True
        for j in range(1, len(pattern) + 1):
            if pattern[j-1] == '*':
                dp[0][j] = dp[0][j-1]
        
        for i in range(1, len(string) + 1):
            for j in range(1, len(pattern) + 1):
                if pattern[j-1] in {string[i-1], '?'}:
                    dp[i][j] = dp[i-1][j-1]
                elif pattern[j-1] == '*':
                    dp[i][j] = dp[i][j-1] or dp[i-1][j]
        
        for i in range(1, len(string) + 1):
            if dp[i][len(pattern)]:
                result.append((i-1, i-len(pattern)))
    
    return result

def max_average_subarray(nums: List[int], k: int) -> Optional[float]:
    if len(nums) < k:
        return None
    current_sum = sum(nums[:k])
    max_sum = current_sum
    
    for i in range(k, len(nums)):
        current_sum += nums[i] - nums[i - k]
        max_sum = max(max_sum, current_sum)
    
    return max_sum / k

def longest_suffix_concat(strings: List[str], separators: List[str]) -> str:
    if not strings:
        return ""
    
    min_length = min(len(s) for s in strings)
    longest_suffix = ""
    
    for i in range(1, min_length + 1):
        suffix = strings[0][-i:]
        if all(s.endswith(suffix) for s in strings):
            longest_suffix = suffix
        else:
            break
    
    combined = ""
    separator_index = 0
    
    for i, string in enumerate(strings):
        combined += string + separators[separator_index]
        separator_index = (separator_index + 1) % len(separators)
    
    combined = combined[:-1]  # Remove the last separator
    
    lines = []
    line = ""
    
    for char in combined:
        if len(line) + len(longest_suffix) > 10:
            lines.append(line)
            line = ""
        line += char
    
    lines.append(line)
    
    return "\n".join(lines)

def perception_clustering(perceptions: List[List[float]], clusters: int) -> (List[int], List[List[float]]):
    centroids = random.sample(perceptions, clusters)
    cluster_assignments = [0] * len(perceptions)
    
    while True:
        # Assign each perception to the closest centroid
        for i, perception in enumerate(perceptions):
            min_distance = float('inf')
            for j, centroid in enumerate(centroids):
                distance = np.linalg.norm(np.array(perception) - np.array(centroid))
                if distance < min_distance:
                    min_distance = distance
                    cluster_assignments[i] = j
        
        # Update the centroids
        new_centroids = []
        for i in range(clusters):
            cluster_perceptions = [perception for j, perception in enumerate(perceptions) if cluster_assignments[j] == i]
            if cluster_perceptions:
                centroid = np.mean(cluster_perceptions, axis=0).tolist()
                new_centroids.append(centroid)
        
        # Check for convergence
        if np.all(np.array(centroids) == np.array(new_centroids)):
            break
        
        centroids = new_centroids
    
    return cluster_assignments, centroids

def calculate_statistics(numbers: List[float], precision: int, stats: List[str]) -> Dict[str, float]:
    results = {}
    for stat in stats:
        if stat == "mean":
            results["mean"] = round(statistics.mean(numbers), precision)
        elif stat == "median":
            results["median"] = round(statistics.median(numbers), precision)
        elif stat == "mode":
            results["mode"] = round(statistics.mode(numbers), precision)
        elif stat == "standard_deviation":
            results["standard_deviation"] = round(math.sqrt(sum((x - statistics.mean(numbers)) ** 2 for x in numbers) / len(numbers)), precision)
    return results

def transaction_clusterer(data: List[List[float]], k: int, threshold: float) -> Dict[int, float]:
    db = DBSCAN(eps=threshold, min_samples=k).fit(data)
    labels = db.labels_
    
    result = {}
    for i in set(labels):
        if i != -1:
            cluster_points = [data[j] for j in range(len(data)) if labels[j] == i]
            avg_distance = np.mean([np.linalg.norm(np.array(cluster_points[j]) - np.array(cluster_points[j-1])) for j in range(1, len(cluster_points))])
            result[i] = avg_distance
    
    return result
```

File: stone_removal.py:

```Python
from typing import List, Dict
from collections import Counter
from typing import List
import numpy as np
from typing import List, Tuple
import random
import heapq

def analyze_strings(strings: List[str], substring: str) -> Dict[str, Dict[str, int]]:
    filtered_strings = [string for string in strings if substring in string]
    remaining_strings = [string for string in strings if substring not in string]
    
    filtered_frequency = Counter(''.join(filtered_strings))
    remaining_frequency = Counter(''.join(remaining_strings))
    
    return {"filtered_frequency": dict(filtered_frequency), "remaining_frequency": dict(remaining_frequency)}

def search_in_sorted_matrix(matrix: List[List[int]], target: int) -> bool:
    if not matrix or not matrix[0]:
        return False
    
    rows, cols = len(matrix), len(matrix[0])
    r, c = 0, cols - 1
    
    while r < rows and c >= 0:
        if matrix[r][c] == target:
            return True
        elif matrix[r][c] > target:
            c -= 1
        else:
            r += 1
            
    return False

def convolve_image(image: np.ndarray, kernel: np.ndarray) -> np.ndarray:
    image_height, image_width = image.shape
    kernel_height, kernel_width = kernel.shape
    feature_map = np.zeros((image_height - kernel_height + 1, image_width - kernel_width + 1))
    
    for i in range(image_height - kernel_height + 1):
        for j in range(image_width - kernel_width + 1):
            patch = image[i:i+kernel_height, j:j+kernel_width]
            feature_map[i, j] = np.sum(patch * kernel)
    
    return feature_map

def generate_permutations(s: str) -> List[str]:
    from itertools import permutations
    
    unique_permutations = set(permutations(s))
    sorted_permutations = sorted(''.join(p) for p in unique_permutations)
    
    return sorted_permutations

def approximate_numbers(numbers: List[float], max_error: float) -> List[int]:
    total_error = 0
    approximated_numbers = []
    
    for number in numbers:
        approximated_number = round(number)
        error = abs(number - approximated_number)
        if total_error + error <= max_error:
            total_error += error
            approximated_numbers.append(approximated_number)
        else:
            # Find the closest integer that minimizes the error
            lower_error = abs(number - (approximated_number - 1))
            upper_error = abs(number - (approximated_number + 1))
            if lower_error < upper_error:
                approximated_numbers.append(approximated_number - 1)
            else:
                approximated_numbers.append(approximated_number + 1)
    
    return approximated_numbers

def filter_and_transform(strings: List[str], threshold: int) -> List[Tuple[str, str]]:
    transformed = []
    for s in strings:
        if len(s) > threshold:
            transformed.append((s, s[::-1].upper()))
    return transformed

def extract_palindromic_words(text: str, min_length: int) -> List[str]:
    words = text.split()
    palindromes = {word for word in words if word.lower() == word[::-1].lower() and len(word) >= min_length}
    return sorted(palindromes)

def randomized_submatrix_selection(matrix: List[List[int]], rows: int, cols: int) -> List[List[int]]:
    non_zero_rows = [i for i, row in enumerate(matrix) if any(element != 0 for element in row)]
    non_zero_cols = [j for j in range(len(matrix[0])) if any(matrix[i][j] != 0 for i in range(len(matrix)))]
    
    selected_rows = random.sample(non_zero_rows, rows)
    selected_cols = random.sample(non_zero_cols, cols)
    
    submatrix = [[matrix[i][j] for j in selected_cols] for i in selected_rows]
    
    return submatrix

def longest_common_subsequence(sequences: List[List[int]], subsequence: List[int]) -> List[int]:
    lcs_lengths = []
    
    for seq in sequences:
        dp = [[0] * (len(subsequence) + 1) for _ in range(len(seq) + 1)]
        for i in range(1, len(seq) + 1):
            for j in range(1, len(subsequence) + 1):
                if seq[i - 1] == subsequence[j - 1]:
                    dp[i][j] = dp[i - 1][j - 1] + 1
                else:
                    dp[i][j] = max(dp[i - 1][j], dp[i][j - 1])
        lcs_lengths.append(dp[len(seq)][len(subsequence)])
    
    return lcs_lengths

def min_sum_subset_with_constraint(nums, k, max_diff):
    nums.sort()
    selected_elements = []
    current_sum = 0
    
    for num in nums:
        if len(selected_elements) < k and (not selected_elements or num - selected_elements[-1] <= max_diff):
            selected_elements.append(num)
            current_sum += num
    
    return selected_elements, current_sum

def min_stone_size(numbers: List[int], k: int) -> int:
    if not numbers or k >= len(numbers):
        return 0
    
    pq = [-num for num in numbers]
    heapq.heapify(pq)
    
    for _ in range(k):
        heapq.heappop(pq)
    
    return -min(pq)
```

File: slcs.py:

```Python
from typing import List
from typing import List, Tuple
from typing import List, Set
from difflib import get_close_matches
from itertools import combinations
from typing import List, Dict
from nltk.sentiment.vader import SentimentIntensityAnalyzer

def maximum_sum_path(triangle: List[List[int]]) -> List[int]:
    rows = len(triangle)
    dp = [[0] * len(row) for row in triangle]
    dp[0][0] = triangle[0][0]
    
    for i in range(1, rows):
        for j in range(len(triangle[i])):
            if j == 0:
                dp[i][j] = dp[i - 1][j] + triangle[i][j]
            elif j == len(triangle[i]) - 1:
                dp[i][j] = dp[i - 1][j - 1] + triangle[i][j]
            else:
                dp[i][j] = max(dp[i - 1][j - 1], dp[i - 1][j]) + triangle[i][j]
    
    max_sum = max(dp[-1])
    max_index = dp[-1].index(max_sum)
    max_path = [max_sum]
    for i in range(rows - 2, -1, -1):
        if max_index == 0:
            max_path.insert(0, dp[i][max_index])
            max_index = max_index
        elif max_index == len(triangle[i]) - 1:
            max_path.insert(0, dp[i][max_index - 1])
            max_index = max_index - 1
        else:
            if dp[i][max_index - 1] > dp[i][max_index]:
                max_path.insert(0, dp[i][max_index - 1])
                max_index = max_index - 1
            else:
                max_path.insert(0, dp[i][max_index])
                max_index = max_index
    
    return max_path

def max_path_sum(grid: List[List[int]]) -> int:
    rows, cols = len(grid), len(grid[0])
    dp = [[0] * cols for _ in range(rows)]
    
    dp[0][0] = grid[0][0]
    for col in range(1, cols):
        dp[0][col] = dp[0][col-1] + grid[0][col]
    for row in range(1, rows):
        dp[row][0] = dp[row-1][0] + grid[row][0]
    
    for row in range(1, rows):
        for col in range(1, cols):
            dp[row][col] = max(dp[row-1][col], dp[row][col-1]) + grid[row][col]
    
    return dp[rows-1][cols-1]

def slcs(sequences: List[List[int]], k: int) -> List[int]:
    if not sequences:
        return []
    
    lengths = [[0] * (k + 1) for _ in range(len(sequences[0]) + 1)]
    
    for seq in sequences[1:]:
        for i in range(1, len(sequences[0]) + 1):
            for j in range(1, k + 1):
                if sequences[0][i - 1] == seq[j - 1]:
                    lengths[i][j] = lengths[i - 1][j - 1] + 1
                else:
                    lengths[i][j] = max(lengths[i - 1][j], lengths[i][j - 1])
    
    slcs = []
    i, j = len(sequences[0]), k
    while i > 0 and j > 0:
        if sequences[0][i - 1] == sequences[1][j - 1]:
            if (i, j) != (len(sequences[0]), k):
                slcs.append(sequences[0][i - 1])
            i -= 1
            j -= 1
        elif lengths[i - 1][j] > lengths[i][j - 1]:
            i -= 1
        else:
            j -= 1
    
    return slcs[::-1]

def trading_simulator(prices: List[float], transactions: List[str]) -> float:
    stack = []
    profit = 0
    
    for i, transaction in enumerate(transactions):
        if transaction == 'buy':
            stack.append(prices[i])
        elif transaction == 'sell' and stack:
            buy_price = stack.pop()
            profit += prices[i] - buy_price
    
    return profit

def merge_intervals(intervals: List[Tuple[int, int]]) -> List[Tuple[int, int]]:
    if not intervals:
        return []
    
    # Sort intervals based on the start time
    intervals.sort(key=lambda x: x[0])
    
    merged = []
    current_interval = intervals[0]
    
    for next_interval in intervals[1:]:
        if current_interval[1] >= next_interval[0]:  # Overlapping intervals
            current_interval = (current_interval[0], max(current_interval[1], next_interval[1]))
        else:
            merged.append(current_interval)
            current_interval = next_interval
    
    merged.append(current_interval)  # Add the last interval
    return merged

def lcs(sequences: List[List[int]], k: int) -> List[int]:
    if not sequences:
        return []
    
    lengths = [[0] * (k + 1) for _ in range(len(sequences[0]) + 1)]
    
    for seq in sequences[1:]:
        for i in range(1, len(sequences[0]) + 1):
            for j in range(1, k + 1):
                if sequences[0][i - 1] == seq[j - 1]:
                    lengths[i][j] = lengths[i - 1][j - 1] + 1
                else:
                    lengths[i][j] = max(lengths[i - 1][j], lengths[i][j - 1])
    
    lcs = []
    i, j = len(sequences[0]), k
    while i > 0 and j > 0:
        if sequences[0][i - 1] == sequences[1][j - 1]:
            lcs.append(sequences[0][i - 1])
            i -= 1
            j -= 1
        elif lengths[i - 1][j] > lengths[i][j - 1]:
            i -= 1
        else:
            j -= 1
    
    return lcs[::-1]

def spell_check_and_correct(sentences: List[str], dictionary: Set[str]) -> List[str]:
    corrected_sentences = []
    
    for sentence in sentences:
        words = sentence.split()
        corrected_words = []
        
        for word in words:
            if word.lower() in dictionary:
                corrected_words.append(word)
            else:
                correction = get_close_matches(word.lower(), dictionary, n=1)
                corrected_words.append(correction[0] if correction else word)
        
        corrected_sentences.append(' '.join(corrected_words))
        
    return corrected_sentences

def unique_combinations_with_threshold(seq, r):
    seq = sorted(set(seq))  # Remove duplicates and sort
    combinations_list = combinations(seq, r)

    # Determine T (the distance threshold) based on the unique elements
    T = min(seq[i+1] - seq[i] for i in range(len(seq) - 1)) if len(seq) > 1 else float('inf')
    
    filtered_combinations = []
    for comb in combinations_list:
        if all(abs(comb[i] - comb[j]) >= T for i in range(len(comb)) for j in range(i + 1, len(comb))):
            filtered_combinations.append(comb)
    
    return sorted(filtered_combinations)

def rotate_array(arr: List[int], n: int) -> List[int]:
    length = len(arr)
    if length == 0:
        return arr
    n = n % length  # normalize n
    if n == 0:
        return arr
    
    # Reverse the whole array
    arr.reverse()
    # Reverse the first n elements
    arr[:n] = reversed(arr[:n])
    # Reverse the rest of the elements
    arr[n:] = reversed(arr[n:])
    
    return arr

def length_of_longest_substring(s: str) -> int:
    char_set = set()
    left = 0
    max_length = 0
    
    for right in range(len(s)):
        while s[right] in char_set:
            char_set.remove(s[left])
            left += 1
        char_set.add(s[right])
        max_length = max(max_length, right - left + 1)
        
    return max_length

def sentiment_analysis_twitter(twitter_data: List[Dict], keywords: List[str], sentiment_threshold: float) -> Dict[str, float]:
    if not twitter_data or not keywords:
        return {}
    
    sia = SentimentIntensityAnalyzer()
    result = {}
    
    for tweet in twitter_data:
        tweet_text = tweet['text']
        sentiment_score = sia.polarity_scores(tweet_text)['compound']
        if sentiment_score >= sentiment_threshold:
            for keyword in keywords:
                if keyword.lower() in tweet_text.lower():
                    if tweet['user'] not in result:
                        result[tweet['user']] = []
                    result[tweet['user']].append(sentiment_score)
    
    for user in result:
        result[user] = sum(result[user]) / len(result[user])
    
    return result
```

File: majority_finder.py:

```Python
from typing import List
from collections import defaultdict
import math
from typing import Tuple
import heapq
from typing import List, Tuple

def sliding_window(time_series: List[float], window_size: int) -> List[List[float]]:
    # Smooth data using median filter
    smoothed_data = []
    for i in range(len(time_series)):
        window = time_series[max(0, i - window_size // 2): min(len(time_series), i + window_size // 2 + 1)]
        smoothed_data.append(sorted(window)[len(window) // 2])
    
    # Segment time series data
    segmented_data = []
    for i in range(0, len(smoothed_data), window_size):
        segmented_data.append(smoothed_data[i: min(len(smoothed_data), i + window_size)])
    
    return segmented_data

def text_segmenter(text: str, window_size: int, step_size: int) -> List[str]:
    words = text.split()
    word_freq = defaultdict(int)
    window_word_freq = defaultdict(int)
    segment_boundaries = [0]
    
    for start in range(0, len(words), step_size):
        if start + window_size <= len(words):
            for word in words[start:start + window_size]:
                window_word_freq[word] += 1
            
            entropy = 0
            for word, freq in window_word_freq.items():
                prob = freq / window_size
                entropy -= prob * math.log2(prob)
            
            for word in words[start:start + window_size]:
                if word not in word_freq:
                    word_freq[word] = defaultdict(int)
                
                word_freq[word][entropy] += 1
            
            max_entropy_change = 0
            max_entropy_change_index = -1
            
            for i in range(start + window_size, len(words)):
                entropy_change = 0
                
                for word in words[i:i + window_size]:
                    if word not in word_freq:
                        word_freq[word] = defaultdict(int)
                    
                    entropy_change += word_freq[word][i] - word_freq[word][i - step_size]
                
                if entropy_change > max_entropy_change:
                    max_entropy_change = entropy_change
                    max_entropy_change_index = i
            
            if max_entropy_change_index != -1:
                segment_boundaries.append(max_entropy_change_index)
        
    segments = []
    for i in range(len(segment_boundaries) - 1):
        segments.append(' '.join(words[segment_boundaries[i]:segment_boundaries[i + 1]]))
    
    return segments

def is_magic_square(matrix: List[List[int]]) -> bool:
    row_sum = sum(matrix[0])
    
    # Check rows
    for row in matrix:
        if sum(row) != row_sum:
            return False
    
    # Check columns
    for col in range(len(matrix[0])):
        if sum(matrix[row][col] for row in range(len(matrix))) != row_sum:
            return False
    
    # Check diagonals
    diagonal1_sum = sum(matrix[i][i] for i in range(len(matrix)))
    diagonal2_sum = sum(matrix[i][len(matrix) - i - 1] for i in range(len(matrix)))
    
    return diagonal1_sum == row_sum and diagonal2_sum == row_sum

def encode_text_and_count(text: str, encoding: str) -> Tuple[bytes, int]:
    byte_representation = text.encode(encoding)
    non_ascii_count = sum(1 for char in text if ord(char) > 127)
    
    return byte_representation, non_ascii_count

def huffman_coding(text: str) -> dict:
    if not text:
        return {}
    
    frequency = {}
    for char in text:
        if char in frequency:
            frequency[char] += 1
        else:
            frequency[char] = 1
            
    priority_queue = [[weight, [symbol, ""]] for symbol, weight in frequency.items()]
    heapq.heapify(priority_queue)
    
    while len(priority_queue) > 1:
        lo = heapq.heappop(priority_queue)
        hi = heapq.heappop(priority_queue)
        for pair in lo[1:]:
            pair[1] = '0' + pair[1]
        for pair in hi[1:]:
            pair[1] = '1' + pair[1]
        heapq.heappush(priority_queue, [lo[0] + hi[0]] + lo[1:] + hi[1:])
                
    return sorted(heapq.heappop(priority_queue)[1:], key=lambda p: (len(p[-1]), p))

def majority_elements(arr: List[int]) -> List[int]:
    count = {}
    n = len(arr)
    
    for num in arr:
        count[num] = count.get(num, 0) + 1
    
    return [num for num, cnt in count.items() if cnt > n / 3]

def calculate_fuel_efficiency(distances: List[float], fuel_consumed: List[float]) -> Tuple[List[float], float]:
    fuel_efficiencies = []
    for distance, fuel in zip(distances, fuel_consumed):
        if fuel == 0:
            continue  # Avoid division by zero
        efficiency = distance / fuel
        fuel_efficiencies.append(efficiency)
    
    max_efficiency = max(fuel_efficiencies) if fuel_efficiencies else 0.0
    
    return fuel_efficiencies, max_efficiency

def group_items_by_length(items: List[str], limit: int) -> List[List[str]]:
    groups = []
    current_group = []
    current_length = 0
    
    for item in items:
        item_length = len(item)
        if current_length + item_length > limit:
            groups.append(current_group)
            current_group = [item]
            current_length = item_length
        else:
            current_group.append(item)
            current_length += item_length
            
    if current_group:
        groups.append(current_group)
    
    return groups

def moving_averages(sequence: List[int], window_size: int) -> List[float]:
    if window_size > len(sequence) or window_size <= 0:
        return []
    
    averages = []
    
    for i in range(len(sequence) - window_size + 1):
        window_sum = sum(sequence[i:i + window_size])
        average = window_sum / window_size
        averages.append(average)
        
    return averages

def minimum_elements(arr: List[int], target: int) -> int:
    n = len(arr)
    if target == 0:
        return 0
    
    table = [float('inf')] * (target + 1)
    table[0] = 0
    
    for num in arr:
        for i in range(num, target + 1):
            table[i] = min(table[i], table[i - num] + 1)
    
    return table[target] if table[target] != float('inf') else -1

def high_value_coordinates(grid: List[List[int]], threshold: int) -> List[Tuple[Tuple[int, int], int]]:
    result = []
    for i in range(len(grid)):
        for j in range(len(grid[0])):
            if grid[i][j] > threshold:
                distance = abs(i) + abs(j)
                result.append(((i, j), distance))
    return result
```

File: knapsack_problems.py:

```Python
from typing import List
from collections import Counter
from typing import Dict, List
import random
import re
from typing import List, Tuple

def find_pattern_occurrences(n: int, arr: List[int], pattern: List[int]) -> List[int]:
    occurrences = []
    len_pattern = len(pattern)
    
    for i in range(n - len_pattern + 1):
        if arr[i:i + len_pattern] == pattern:
            occurrences.append(i)
    
    return occurrences

def top_n_frequent_words(string, n):
    words = string.lower().split()
    count = Counter(words)
    
    return [word for word, _ in count.most_common(n)]

def lowest_common_ancestor(tree: Dict[int, List[int]], root: int) -> int:
    ancestors = set()
    stack = [root]
    
    while stack:
        node = stack.pop()
        ancestors.add(node)
        
        for child in tree.get(node, []):
            stack.append(child)
    
    lca = root
    
    for node in ancestors:
        if all(node in ancestors for child in tree.get(node, [])):
            lca = node
    
    return lca

def pair_generator(num_pairs: int, max_num: int) -> List[List[int]]:
    if num_pairs > max_num * (max_num - 1) // 2:
        raise ValueError("num_pairs cannot be greater than the total possible pairs")
    
    pairs = set()
    while len(pairs) < num_pairs:
        pair = tuple(sorted((random.randint(1, max_num), random.randint(1, max_num))))
        if pair[0] != pair[1]:  # ensure the pair does not contain duplicate numbers
            pairs.add(pair)
    
    return [list(pair) for pair in pairs]

def extract_relevant_sentences(text: str, keywords: List[str]) -> List[str]:
    if not text or not keywords:
        return []
    
    sentences = re.split(r'[.!?]', text)
    sentences = [sentence.strip() for sentence in sentences if sentence]
    
    keyword_counts = Counter(keyword.lower() for keyword in keywords)
    
    relevant_sentences = []
    
    for sentence in sentences:
        sentence_keywords = [keyword for keyword in keywords if keyword.lower() in sentence.lower()]
        sentence_score = sum(keyword_counts[keyword.lower()] for keyword in sentence_keywords)
        
        if sentence_score > 0:
            relevant_sentences.append((sentence, sentence_score))
    
    relevant_sentences.sort(key=lambda x: x[1], reverse=True)
    
    return [sentence for sentence, _ in relevant_sentences]

def knapsack_max_value(n, capacity, items):
    dp = [0] * (capacity + 1)

    for value, weight in items:
        for w in range(capacity, weight - 1, -1):
            dp[w] = max(dp[w], dp[w - weight] + value)

    return dp[capacity]

def compute_weight_distances(n: int, weights: List[int], pairs: List[Tuple[int, int]]) -> int:
    total_distance = 0
    for i, j in pairs:
        if i < 0 or i >= n or j < 0 or j >= n:
            raise IndexError("Index out of bounds")
        total_distance += abs(weights[i] - weights[j])
    return total_distance

def kmeans_clustering(data: List[List[float]], k: int) -> List[int]:
    centroids = random.sample(data, k)
    cluster_assignments = [0] * len(data)
    
    while True:
        new_cluster_assignments = []
        for i, point in enumerate(data):
            min_distance = float('inf')
            cluster_index = 0
            for j, centroid in enumerate(centroids):
                distance = sum((a - b) ** 2 for a, b in zip(point, centroid))
                if distance < min_distance:
                    min_distance = distance
                    cluster_index = j
            new_cluster_assignments.append(cluster_index)
        
        if new_cluster_assignments == cluster_assignments:
            break
        
        cluster_assignments = new_cluster_assignments
        
        for i in range(k):
            points_in_cluster = [point for j, point in enumerate(data) if cluster_assignments[j] == i]
            if points_in_cluster:
                centroids[i] = [sum(x) / len(points_in_cluster) for x in zip(*points_in_cluster)]
    
    return cluster_assignments

def three_sum_unique(arr, target):
    arr.sort()
    unique_triplets = []
    
    n = len(arr)
    for i in range(n):
        if i > 0 and arr[i] == arr[i - 1]:
            continue
            
        left, right = i + 1, n - 1
        while left < right:
            current_sum = arr[i] + arr[left] + arr[right]
            if current_sum == target:
                unique_triplets.append((arr[i], arr[left], arr[right]))
                while left < right and arr[left] == arr[left + 1]:
                    left += 1
                while left < right and arr[right] == arr[right - 1]:
                    right -= 1
                left += 1
                right -= 1
            elif current_sum < target:
                left += 1
            else:
                right -= 1

    return unique_triplets

def find_first_peak(sequence: List[int]) -> int:
    low, high = 0, len(sequence) - 1
    
    while low < high:
        mid = low + (high - low) // 2
        
        if sequence[mid] > sequence[mid + 1]:
            high = mid
        else:
            low = mid + 1
    
    if low == 0 and sequence[low] > sequence[1]:
        return sequence[low]
    elif low == len(sequence) - 1 and sequence[low] > sequence[low - 1]:
        return sequence[low]
    elif sequence[low] > sequence[low - 1] and sequence[low] > sequence[low + 1]:
        return sequence[low]
    
    return -1

def closest_pair_equal_elements(nums: List[int]) -> int:
    if len(nums) < 2:
        raise ValueError("List has less than two elements")
    
    nums.sort()
    min_diff = float('inf')
    
    for i in range(1, len(nums)):
        if nums[i] == nums[i - 1]:
            min_diff = min(min_diff, i - (i - 1))
    
    if min_diff == float('inf'):
        raise ValueError("No pairs of equal elements")
    
    return min_diff
```

File: dna_analysis.py:

```Python
from typing import List
from typing import List, Tuple, Dict
from typing import Dict
from typing import List, Dict
from collections import defaultdict
from collections import deque
import re
from collections import Counter
import math

def align_sequences(sequences: List[List[int]], gap_penalty: int) -> List[List[int]]:
    m, n = len(sequences[0]), len(sequences[1])
    dp = [[0 for _ in range(n + 1)] for _ in range(m + 1)]
    
    for i in range(m + 1):
        dp[i][0] = gap_penalty * i
    for j in range(n + 1):
        dp[0][j] = gap_penalty * j
    
    for i in range(1, m + 1):
        for j in range(1, n + 1):
            match = dp[i - 1][j - 1] + (sequences[0][i - 1] == sequences[1][j - 1])
            delete = dp[i - 1][j] + gap_penalty
            insert = dp[i][j - 1] + gap_penalty
            dp[i][j] = max(match, delete, insert)
    
    aligned_sequences = [[], []]
    i, j = m, n
    while i > 0 or j > 0:
        if i > 0 and j > 0 and dp[i][j] == dp[i - 1][j - 1] + (sequences[0][i - 1] == sequences[1][j - 1]):
            aligned_sequences[0].append(sequences[0][i - 1])
            aligned_sequences[1].append(sequences[1][j - 1])
            i -= 1
            j -= 1
        elif i > 0 and dp[i][j] == dp[i - 1][j] + gap_penalty:
            aligned_sequences[0].append(sequences[0][i - 1])
            aligned_sequences[1].append(-1)
            i -= 1
        else:
            aligned_sequences[0].append(-1)
            aligned_sequences[1].append(sequences[1][j - 1])
            j -= 1
    
    return [aligned_sequences[0][::-1], aligned_sequences[1][::-1]]

def process_transactions(transactions: List[Tuple[int, int, str]]) -> Dict[int, int]:
    balances = {}
    
    for account, amount, transaction_type in transactions:
        if account not in balances:
            balances[account] = 0
        
        if transaction_type == "deposit":
            balances[account] += amount
        elif transaction_type == "withdrawal":
            balances[account] -= amount
    
    return balances

def update_matrix(mat: List[List[int]], row: int, col: int, val: int) -> List[List[int]]:
    if mat[row][col] == val:
        return mat
    
    mat[row][col] = val
    for j in range(len(mat[0])):
        if j != col:
            mat[row][j] = 0
    for i in range(len(mat)):
        if i != row:
            mat[i][col] = 0
    
    return mat

def find_target_row(matrix: List[List[int]], target_row: List[int]) -> int:
    target_row_set = set(target_row)
    for i, row in enumerate(matrix):
        if set(row) >= target_row_set:
            return i
    return -1

def ngram_index(text: str, max_window_size: int) -> Dict[str, int]:
    text = text.lower().split()
    index = {}
    
    for window_size in range(1, max_window_size + 1):
        for i in range(len(text) - window_size + 1):
            ngram = ' '.join(text[i:i + window_size])
            index[ngram] = index.get(ngram, 0) + 1
    
    return index

def evaluate_students(students: List[List[int]], threshold: int) -> Dict[int, str]:
    results = {}
    for i, student in enumerate(students):
        average_grade = sum(student) / len(student)
        if average_grade >= threshold:
            results[i] = "Pass"
        else:
            results[i] = "Fail"
    return results

def most_frequent_motif(sequences: List[str], k: int) -> str:
    if not sequences or k > len(sequences[0]):
        return "k is larger than the sequence length"
    
    motif_count = defaultdict(int)
    for sequence in sequences:
        for i in range(len(sequence) - k + 1):
            motif = sequence[i:i + k]
            motif_count[motif] += 1
    
    return max(motif_count, key=motif_count.get)

def precision_rounding(numbers: List[float], precision: int) -> List[float]:
    cumulative_error = 0
    rounded_numbers = []
    
    for num in numbers:
        rounded_num = round(num + cumulative_error, precision)
        cumulative_error += (num - rounded_num)
        rounded_numbers.append(rounded_num)
    
    return rounded_numbers

def median_component(graph: List[List[int]], vertices: int) -> List[List[List[int]]]:
    total_distance = 0
    distance_matrix = [[float('inf')] * vertices for _ in range(vertices)]
    
    for i in range(vertices):
        distance_matrix[i][i] = 0
    
    for u, v in graph:
        distance_matrix[u][v] = distance_matrix[v][u] = 1
    
    for k in range(vertices):
        for i in range(vertices):
            for j in range(vertices):
                distance_matrix[i][j] = min(distance_matrix[i][j], distance_matrix[i][k] + distance_matrix[k][j])
                total_distance += distance_matrix[i][j]
    
    median_distance = total_distance // (vertices * (vertices - 1) // 2)
    
    visited = [False] * vertices
    median_component = []
    subgraph1 = []
    subgraph2 = []
    
    for start in range(vertices):
        if not visited[start]:
            queue = deque([start])
            visited[start] = True
            subgraph = [start]
            
            while queue:
                node = queue.popleft()
                for neighbor, edge_length in enumerate(distance_matrix[node]):
                    if edge_length == median_distance and not visited[neighbor]:
                        queue.append(neighbor)
                        visited[neighbor] = True
                        subgraph.append(neighbor)
            
            median_component.append(subgraph)
            if len(subgraph) > len(median_component[0]):
                subgraph1 = median_component[0]
                median_component[0] = subgraph
            else:
                subgraph2 = subgraph
    
    return [subgraph1, subgraph2]

def tf_idf(text: str, stopwords: List[str]) -> List[tuple]:
    # Tokenize the text into words
    words = re.findall(r'\b\w+\b', text.lower())
    
    # Remove stopwords
    words = [word for word in words if word not in stopwords]
    
    # Calculate term frequency (TF)
    tf = Counter(words)
    tf = {word: count / len(words) for word, count in tf.items()}
    
    # Calculate inverse document frequency (IDF)
    idf = {word: math.log(1 + 1 / (1 + tf[word])) for word in tf}
    
    # Calculate TF-IDF scores
    tf_idf_scores = {word: tf[word] * idf[word] for word in tf}
    
    # Return the top keywords with their TF-IDF scores
    return sorted(tf_idf_scores.items(), key=lambda x: x[1], reverse=True)[:10]

def max_profit_with_fee(prices, fee):
    cash = 0
    hold = -prices[0]
    
    for price in prices:
        cash = max(cash, hold + price - fee)  # Sell operation
        hold = max(hold, cash - price)        # Buy operation
    
    return cash
```

File: matrix_generator.py:

```Python
import numpy as np
from typing import List, Dict, Tuple
from typing import List
import re
from collections import deque
from typing import List, Tuple
from itertools import combinations

def generate_matrix_with_condition(size, threshold):
    matrix = np.random.randint(0, threshold, size=(size, size)).tolist()
    condition_met = False
    
    for row in matrix:
        if sum(row) > threshold / 2:
            condition_met = True
            break
    
    for col in range(size):
        if sum(matrix[row][col] for row in range(size)) > threshold / 2:
            condition_met = True
            break
    
    return matrix, condition_met

def svd_reconstruction(matrix, k):
    # Perform SVD on the matrix
    U, s, Vh = np.linalg.svd(matrix, full_matrices=False)
    
    # Retain only the top-k singular values and singular vectors
    Uk = U[:, :k]
    sk = s[:k]
    Vkh = Vh[:k, :]
    
    # Reconstruct the matrix from the retained singular values and singular vectors
    reconstructed_matrix = Uk @ np.diag(sk) @ Vkh
    
    return reconstructed_matrix

def dbscan_clustering(points: List[Tuple[float, float]], epsilon: float, min_samples: int) -> Dict[int, List[Tuple[float, float]]]:
    from sklearn.cluster import DBSCAN
    clustering = DBSCAN(eps=epsilon, min_samples=min_samples).fit(points)
    clusters = {}
    for i, label in enumerate(clustering.labels_):
        if label not in clusters:
            clusters[label] = []
        clusters[label].append(points[i])
    
    return clusters

def largest_submatrix(matrix: List[List[int]], target: int) -> int:
    rows, cols = len(matrix), len(matrix[0])
    prefix_sum = [[0] * (cols + 1) for _ in range(rows + 1)]
    
    for i in range(1, rows + 1):
        for j in range(1, cols + 1):
            prefix_sum[i][j] = matrix[i - 1][j - 1] + prefix_sum[i - 1][j] + prefix_sum[i][j - 1] - prefix_sum[i - 1][j - 1]
    
    max_size = 0
    for i in range(rows):
        for j in range(cols):
            for k in range(i + 1, rows + 1):
                for end_col in range(j + 1, cols + 1):
                    submatrix_sum = prefix_sum[k][end_col] - prefix_sum[k][j] - prefix_sum[i][end_col] + prefix_sum[i][j]
                    if submatrix_sum <= target:
                        max_size = max(max_size, (k - i) * (end_col - j))
    
    return max_size

def sentence_extractor(text: str, keywords: List[str]) -> List[str]:
    sentences = re.split(r'[.!?]', text)
    extracted_sentences = []
    
    for sentence in sentences:
        sentence = re.sub(r'[^\w\s]', '', sentence).strip()
        if any(keyword.lower() in sentence.lower() for keyword in keywords):
            extracted_sentences.append(sentence)
            
    return extracted_sentences

def bidirectional_search(graph: List[List[int]], start_node: int, end_node: int) -> List[int]:
    num_nodes = len(graph)
    start_queue = deque([start_node])
    end_queue = deque([end_node])
    start_visited = [False] * num_nodes
    end_visited = [False] * num_nodes
    start_parent = [None] * num_nodes
    end_parent = [None] * num_nodes
    
    while start_queue or end_queue:
        if start_queue:
            current_node = start_queue.popleft()
            start_visited[current_node] = True
            for neighbor, edge in enumerate(graph[current_node]):
                if edge == 1 and not start_visited[neighbor]:
                    start_queue.append(neighbor)
                    start_parent[neighbor] = current_node
                    if end_visited[neighbor]:
                        break
        if end_queue:
            current_node = end_queue.popleft()
            end_visited[current_node] = True
            for neighbor, edge in enumerate(graph[current_node]):
                if edge == 1 and not end_visited[neighbor]:
                    end_queue.append(neighbor)
                    end_parent[neighbor] = current_node
                    if start_visited[neighbor]:
                        break
        else:
            continue
        break
    if current_node is None:
        return []
    
    path = []
    while current_node is not None:
        path.append(current_node)
        current_node = start_parent[current_node] if current_node != start_node else None
    path.reverse()
    
    for i in range(1, len(path)):
        current_node = end_parent[path[i]]
        while current_node != path[i]:
            path.insert(i, current_node)
            current_node = end_parent[current_node]
    
    return path

def longest_allowed_substring(s: str, allowed_chars: set) -> str:
    max_length = 0
    max_substr = ""
    current_substr = ""
    
    for char in s:
        if char in allowed_chars:
            current_substr += char
            if len(current_substr) > max_length:
                max_length = len(current_substr)
                max_substr = current_substr
        else:
            current_substr = ""
    
    return max_substr

def negative_cycle_detector(edges: List[Tuple[int, int, int]], vertices: int) -> Tuple[List[List[int]], List[int]]:
    distances = [[float('inf')]*vertices for _ in range(vertices)]
    
    for _ in range(vertices-1):
        for u, v, w in edges:
            distances[u][v] = min(distances[u][v], distances[u][u] + w)
    
    negative_cycle_vertices = []
    for u, v, w in edges:
        if distances[u][v] > distances[u][u] + w:
            distances[u][v] = distances[u][u] + w
            negative_cycle_vertices.append(v)
    
    return distances, negative_cycle_vertices

def subsets_with_target_mean(arr: List[int], target_mean: float) -> List[List[int]]:
    target_sum = target_mean * 2  # Start with a base, we need at least 2 elements to compute mean
    result_subsets = []
    
    n = len(arr)
    for r in range(2, n + 1):
        for subset in combinations(arr, r):
            if sum(subset) == target_sum and len(subset) > 0:
                result_subsets.append(list(subset))
    
    return result_subsets

def floyd_cycle_detection(numbers, precision):
    tortoise = numbers[0]
    hare = numbers[0]
    
    while True:
        tortoise = numbers[int(tortoise * precision) % len(numbers)]
        hare = numbers[int(numbers[int(hare * precision) % len(numbers)] * precision) % len(numbers)]
        
        if abs(tortoise - hare) < 1e-6:
            break
    
    ptr1 = numbers[0]
    ptr2 = tortoise
    
    while abs(ptr1 - ptr2) >= 1e-6:
        ptr1 = numbers[int(ptr1 * precision) % len(numbers)]
        ptr2 = numbers[int(ptr2 * precision) % len(numbers)]
    
    cycle_length = 1
    ptr2 = numbers[int(ptr2 * precision) % len(numbers)]
    
    while abs(ptr1 - ptr2) >= 1e-6:
        ptr2 = numbers[int(ptr2 * precision) % len(numbers)]
        cycle_length += 1
    
    return (cycle_length > 1, cycle_length)

def validate_parentheses(text: str, max_depth: int) -> bool:
    stack = []
    depth = 0
    
    for char in text:
        if char == '(':
            stack.append(char)
            depth += 1
            
            if depth > max_depth:
                return False
        elif char == ')':
            if not stack:
                return False
            
            stack.pop()
            depth -= 1
    
    return not stack
```

File: route_optimization.py:

```Python
from typing import List
import itertools
from collections import deque
from typing import List, Tuple, Dict
import math
from collections import Counter
import re
from typing import List, Dict
from typing import List, Tuple
import sys
import heapq
from typing import Dict, List, Tuple, Optional

def find_k_sum_combinations(num_list: List[int], target_sum: int, k: int) -> List[List[int]]:
    if len(num_list) < k:
        return []
    
    num_list.sort()
    result = set()
    
    for comb in itertools.combinations(num_list, k):
        if sum(comb) == target_sum:
            result.add(tuple(sorted(comb)))
    
    return [list(comb) for comb in sorted(result)]

def assign_events(intervals: List[List[int]], capacities: List[int], num_rooms: int, events: List[int]) -> List[List[int]]:
    intervals.sort(key=lambda x: x[0])  # Sort intervals by start time
    room_assigned_events = [[] for _ in range(num_rooms)]  # Initialize room events
    room_available_times = [0] * num_rooms  # Initialize room available times
    
    for start, end in intervals:
        room_idx = -1
        earliest_available_time = float('inf')
        
        for i, available_time in enumerate(room_available_times):
            if available_time <= start and len(room_assigned_events[i]) < capacities[i] and available_time < earliest_available_time:
                room_idx = i
                earliest_available_time = available_time
        
        if room_idx != -1:
            room_assigned_events[room_idx].append(events[0])
            room_available_times[room_idx] = end
            events.pop(0)
    
    return room_assigned_events

def min_water_needed(trees: List[List[int]], target_height: int) -> int:
    total_water = 0
    queue = deque([(i, x) for i, level in enumerate(trees) for x in level])
    visited = set((x for level in trees for x in level))
    
    while queue:
        current_level, current_node = queue.popleft()
        
        if current_level >= target_height:
            break
        
        for next_node in trees[current_level + 1]:
            if next_node not in visited and abs(next_node - current_node) <= 1:
                queue.append((current_level + 1, next_node))
                visited.add(next_node)
                total_water += 1
    
    return total_water

def markov_chain_simulator(matrix: List[List[float]], initial_state: List[float], steps: int) -> List[float]:
    state_probabilities = initial_state
    
    for _ in range(steps):
        state_probabilities = [sum([state_probabilities[j] * matrix[j][i] for j in range(len(state_probabilities))]) for i in range(len(state_probabilities))]
    
    return state_probabilities

def classify_points_with_minkowski_distance(points: List[Tuple[float, float]], radius: float) -> Dict[Tuple[float, float], str]:
    classification = {}
    
    for point in points:
        distance = (abs(point[0]) ** 2 + abs(point[1]) ** 2) ** 0.5
        if distance < radius:
            classification[point] = "within"
        elif distance > radius:
            classification[point] = "outside"
        else:
            classification[point] = "on"
    
    return classification

def common_words(text: str, threshold: int) -> List[str]:
    words = re.findall(r'\b\w+\b', text.lower())
    word_freq = Counter(words)
    common_words = [word for word, freq in word_freq.items() if freq >= threshold]
    common_words.sort(key=lambda word: word_freq[word], reverse=True)
    
    return common_words

def evaluate_expressions(arithmetic_expressions: List[str], variables: Dict[str, int]) -> List[int]:
    evaluated_values = []
    
    for expression in arithmetic_expressions:
        expression = expression.replace(' ', '')
        
        for var, value in variables.items():
            expression = expression.replace(var, str(value))
        
        try:
            evaluated_values.append(eval(expression))
        except ZeroDivisionError:
            evaluated_values.append(None)
    
    return evaluated_values

def min_trucks(routes: List[List[int]], capacity: int) -> int:
    demand = [0] * len(routes)
    for i, route in enumerate(routes):
        demand[i] = max(route)
    
    return sum((d + capacity - 1) // capacity for d in demand)

def max_length_intervals(intervals: List[List[int]], k: int) -> List[List[int]]:
    intervals.sort(key=lambda x: x[1])
    dp = [[None for _ in range(k + 1)] for _ in range(len(intervals) + 1)]
    result = []
    
    for i in range(1, len(intervals) + 1):
        for j in range(1, min(i + 1, k + 1)):
            max_length = 0
            prev_interval = None
            for prev in range(i):
                if intervals[prev][1] <= intervals[i - 1][0] and dp[prev][j - 1] is not None:
                    length = intervals[i - 1][1] - intervals[i - 1][0] + dp[prev][j - 1][0]
                    if length > max_length:
                        max_length = length
                        prev_interval = prev
            if max_length > 0:
                dp[i][j] = (max_length, intervals[i - 1])
                if prev_interval is not None:
                    dp[i][j] += dp[prev_interval][j - 1][1:]
    
    if dp[-1][-1] is not None:
        result = [dp[-1][-1][1]]
        i, j = len(intervals), k
        while j > 1:
            i = dp[i][j][2]
            result.append(dp[i][j - 1][1])
            j -= 1
        result.reverse()
    
    return result

def expected_heads(probabilities: List[List[float]], n: int) -> float:
    rows, cols = len(probabilities), len(probabilities[0])
    
    expected_heads = [[0.0] * cols for _ in range(rows)]
    expected_heads[0] = [p[0] for p in probabilities[0]]
    
    for i in range(1, rows):
        for j in range(cols):
            expected_heads[i][j] = (expected_heads[i - 1][j] * probabilities[i - 1][j][0] +
                                    expected_heads[i - 1][j - 1] * probabilities[i - 1][j - 1][1] +
                                    (j + 1) * probabilities[i][j][1])
    
    return expected_heads[-1][-1]

def find_shortest_path(adjacency_list: Dict[int, List[Tuple[int, int]]], source: int, target: int) -> Optional[Tuple[int, List[int]]]:
    queue = [(0, source, [])]
    seen = set()
    while queue:
        (dist, node, path) = heapq.heappop(queue)
        if node not in seen:
            seen.add(node)
            path = path + [node]
            if node == target:
                return (dist, path)
            for neighbor, neigh_dist in adjacency_list[node]:
                if neighbor not in seen:
                    heapq.heappush(queue, (dist + neigh_dist, neighbor, path))
    return None
```

--------------------------------------------------------------------------------------------------

Problem Statement: Parameters:
- sequence: str # A sequence of characters from which we will extract common substrings.
- k: int # The length of the substrings to consider for frequency calculation.
- threshold: float # The minimum frequency for a substring to be considered common.
- n: int # Number of elements in the list from which to find the closest triplet sum.
- arr: List[int] # Input list of integers for finding the closest triplet sum.
- x: int # The target number for which the closest sum of three elements will be calculated.
- numbers: List[float] # A list of numbers to compute statistical measures.
- precision: int # The number of decimal places to round the statistical measures.
- stats: List[str] # A list of statistical measures to calculate.
- items: List[Tuple[int, int]] # Input items for solving the knapsack problem, represented by (value, weight).
- capacity: int # The maximum capacity of the knapsack.
- routes: List[List[int]] # A list of routes represented by a list of nodes.
- truck_capacity: int # The capacity of each truck for delivering goods.

Objectives:
- Calculate the frequency of each substring of length `k` in the given `sequence` using the common substring detection logic.
- Identify the common substrings that occur with a frequency above the specified `threshold` and store them.
- Find the three elements in the `arr` that produce the closest sum to the target `x`.
- Calculate specified statistical measures (mean, median, mode, standard deviation) for the list of `numbers`, rounding the results to the specified `precision`, and return the results in a dictionary.
- Solve a 0/1 Knapsack problem using the given `items` and `capacity` to maximize the total value, and return the maximum value achievable.
- Implement the logic to calculate the minimum number of trucks required to deliver goods along all `routes`, ensuring that the total demand for each route does not exceed the `truck_capacity`.
- Combine the results of the common substrings, closest triplet sum, statistical measures, maximum knapsack value, and minimum truck count into a single summary output.

Return Values:
- common_substrings_result: Dict[str, int] # A dictionary of common substrings and their frequencies based on the provided sequence and threshold.
- closest_triplet: List[int] # A list of three integers representing the closest triplet sum to the specified target.
- statistics: Dict[str, float] # A dictionary containing statistical measurements rounded to the specified precision.
- max_knapsack_value: int # The maximum value obtainable with the given items in the knapsack.
- min_truck_count: int # The minimum number of trucks required to fulfill all routes.

The name of the function you create should be aggregate_analysis and it should return a tuple.

--------------------------------------------------------------------------------------------------

Answer Code:
def aggregate_analysis(sequence: str, k: int, threshold: float, n: int, arr: List[int], x: int, 
                       numbers: List[float], precision: int, stats: List[str], items: List[Tuple[int, int]], 
                       capacity: int, routes: List[List[int]], truck_capacity: int) -> Tuple[Dict[str, int], List[int], Dict[str, float], int, int]:
    # Step 1: Use common substring function
    common_substrings_result = common_substrings(sequence, k, threshold)
    # Step 2: Use closest triplet sum function to get the closest triplet
    closest_triplet = closest_triplet_sum(n, arr, x)
    # Step 3: Use calculate statistics to get statistical measures
    statistics = calculate_statistics(numbers, precision, stats)
    # Step 4: Use the knapsack function to calculate the max value
    max_knapsack_value = knapsack_max_value(len(items), capacity, items)
    # Step 5: Calculate the minimum number of trucks needed
    min_truck_count = min_trucks(routes, truck_capacity)
    # Step 6: Create a summary output with all results
    return common_substrings_result, closest_triplet, statistics, max_knapsack_value, min_truck_count

--------------------------------------------------------------------------------------------------

Test Code:
# Import statements if required
from typing import List, Dict, Tuple
from collections import defaultdict
import statistics
import math

# Initialize input parameters
sequence = "abcabcabc"
k = 2
threshold = 0.25
n = 5
arr = [1, 2, 3, 4, 5]
x = 7
numbers = [1.5, 2.5, 3.5, 4.5, 5.5]
precision = 2
stats = ["mean", "median", "mode", "standard_deviation"]
items = [(60, 10), (100, 20), (120, 30)]
capacity = 50
routes = [[1, 2, 3], [2, 3, 4], [3, 4, 5]]
truck_capacity = 3

# Call function with input parameters
return_common_substrings, return_closest_triplet, return_statistics, return_max_knapsack_value, return_min_truck_count = aggregate_analysis(
    sequence, k, threshold, n, arr, x, numbers, precision, stats, items, capacity, routes, truck_capacity
)

# Step-by-step run-through of function to obtain intermediate outputs:

# Step 1
# Explanation: Calculate frequency of each substring of length `k`
frequencies = defaultdict(int)
for i in range(len(sequence) - k + 1):
    substring = sequence[i:i+k]
    frequencies[substring] += 1

# Calculate common substrings based on the frequency threshold
common_substrings_result = {substring: frequency for substring, frequency in frequencies.items() if frequency / len(sequence) >= threshold}

# Step 2
# Explanation: Find closest triplet sum
arr.sort()
closest_sum = float('inf')
closest_triplet = []

for i in range(n - 2):
    left, right = i + 1, n - 1 

    while left < right:
        current_sum = arr[i] + arr[left] + arr[right]

        if abs(current_sum - x) < abs(closest_sum - x):
            closest_sum = current_sum
            closest_triplet = [arr[i], arr[left], arr[right]]

        if current_sum < x:
            left += 1
        elif current_sum > x:
            right -= 1
        else:
            closest_triplet = [arr[i], arr[left], arr[right]]
            break

# Step 3
# Explanation: Calculate statistical measures
statistics_result = {}
for stat in stats:
    if stat == "mean":
        statistics_result["mean"] = round(statistics.mean(numbers), precision)
    elif stat == "median":
        statistics_result["median"] = round(statistics.median(numbers), precision)
    elif stat == "mode":
        statistics_result["mode"] = round(statistics.mode(numbers), precision)
    elif stat == "standard_deviation":
        statistics_result["standard_deviation"] = round(math.sqrt(sum((x - statistics.mean(numbers)) ** 2 for x in numbers) / len(numbers)), precision)

# Step 4
# Explanation: Calculate maximum value obtainable in the knapsack
dp = [0] * (capacity + 1)

for value, weight in items:
    for w in range(capacity, weight - 1, -1):
        dp[w] = max(dp[w], dp[w - weight] + value)

max_knapsack_value = dp[capacity]

# Step 5
# Explanation: Calculate minimum number of trucks needed
demand = [0] * len(routes)
for i, route in enumerate(routes):
    demand[i] = max(route)

min_truck_count = sum((d + truck_capacity - 1) // truck_capacity for d in demand)

# Final Expected Output:
correct_common_substrings = common_substrings_result
correct_closest_triplet = closest_triplet
correct_statistics = statistics_result
correct_max_knapsack_value = max_knapsack_value
correct_min_truck_count = min_truck_count

# Assert statements (compulsory) to check if the function returns the correct values:
assert return_common_substrings == correct_common_substrings
assert return_closest_triplet == correct_closest_triplet
assert return_statistics == correct_statistics
assert return_max_knapsack_value == correct_max_knapsack_value
assert return_min_truck_count == correct_min_truck_count

print('All-Pass')

--------------------------------------------------------------------------------------------------

