import json
from tabulate import tabulate

log_file_path = '/home/user/code/code_gen/api_2.log'

model_stats = {}

try:
    with open(log_file_path, 'r', encoding='utf-8') as file:
        for line_number, line in enumerate(file, 1):
            line = line.strip()
            if not line:
                continue
                
            try:
                data = json.loads(line)
                model = data['model_name']
                prompt_tokens = data['usage']['prompt_tokens']
                completion_tokens = data['usage']['completion_tokens']
                
                if model not in model_stats:
                    model_stats[model] = {
                        'total_prompt_tokens': 0,
                        'total_completion_tokens': 0,
                        'count': 0
                    }
                
                model_stats[model]['total_prompt_tokens'] += prompt_tokens
                model_stats[model]['total_completion_tokens'] += completion_tokens
                model_stats[model]['count'] += 1
                
            except json.JSONDecodeError as e:
                print(f"Warning: JSON decode error on line {line_number}: {e}")
            except KeyError as e:
                print(f"Warning: Missing key {e} on line {line_number}")
                
except FileNotFoundError:
    print(f"Error: Log file not found at {log_file_path}")
    exit(1)
except Exception as e:
    print(f"Error reading file: {e}")
    exit(1)

if model_stats:
    table_data = []
    for model, stats in model_stats.items():
        avg_input = stats['total_prompt_tokens'] / stats['count']
        avg_output = stats['total_completion_tokens'] / stats['count']
        table_data.append([model, f"{avg_input:.2f}", f"{avg_output:.2f}", stats['count']])
    
    table_data.sort(key=lambda x: x[0])
    
    headers = ["Model Name", "Avg Input Tokens", "Avg Output Tokens", "Count"]
    print(tabulate(table_data, headers=headers, tablefmt="grid", numalign="right"))
    
    print(f"\nSummary: Processed {sum(stats['count'] for stats in model_stats.values())} entries")
    print(f"Found {len(model_stats)} different models")
    
else:
    print("No valid data found in the log file.")