import torch
import numpy as np
from sklearn.cluster import KMeans


def find_optimal_k_elbow(rewards, max_k=12, min_k=1):
    std = rewards.std()
    if std < 1e-6:
        return 1
    
    rewards_np = rewards.cpu().numpy().reshape(-1, 1)
    
    actual_max_k = min(max_k + 1, len(rewards_np))

    if actual_max_k <= min_k:
        return 1
        
    inertias = []
    k_range = range(min_k, actual_max_k)
    
    for k in k_range:
        kmeans = KMeans(n_clusters=k, random_state=0, n_init='auto').fit(rewards_np)
        inertias.append(kmeans.inertia_)
    
    if not inertias:
        return 1

    try:
        diff1 = np.diff(inertias)
        diff2 = np.diff(diff1)
        optimal_k = k_range[np.argmax(diff2) + 1]
    except (ValueError, IndexError):
        optimal_k = min_k
        
    return optimal_k
