[
    {
        "0": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\nfrom sklearn.model_selection import train_test_split\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder, PolynomialFeatures\nfrom torch.utils.data import DataLoader, TensorDataset\n\ndef data_loader(train_path: str, test_path: str):\n    # Load datasets using pandas\n    train_df = pd.read_excel(train_path)\n    test_df = pd.read_excel(test_path)\n\n    # Select relevant columns\n    relevant_columns = [\n        'x', 'y', 'Dominant Wave Direction',\n        'Breaker Wave Height Hb', 'Mean Grain Size'\n    ]\n    train_df = train_df[relevant_columns]\n    test_df = test_df[relevant_columns]\n\n    # Handle missing values\n    for column in train_df.columns:\n        if train_df[column].dtype == np.number:\n            train_df[column].fillna(train_df[column].mean(), inplace=True)\n            test_df[column].fillna(test_df[column].mean(), inplace=True)\n        else:\n            train_df[column].fillna(train_df[column].mode()[0], inplace=True)\n            test_df[column].fillna(test_df[column].mode()[0], inplace=True)\n\n    return train_df, test_df\n\ndef feature_engineering(df: pd.DataFrame):\n    # Encode categorical variables\n    ohe = OneHotEncoder(sparse=False)\n    wave_dir_encoded = ohe.fit_transform(df[['Dominant Wave Direction']])\n    \n    # Create polynomial features\n    poly = PolynomialFeatures(degree=2, include_bias=False)\n    x_poly = poly.fit_transform(df[['x']])\n\n    # Concatenate original with new features\n    df = df.drop(columns=['Dominant Wave Direction'])\n    df = pd.concat([\n        df.reset_index(drop=True),\n        pd.DataFrame(wave_dir_encoded, columns=ohe.get_feature_names_out(['Dominant Wave Direction'])),\n        pd.DataFrame(x_poly, columns=poly.get_feature_names_out(['x']))\n    ], axis=1)\n\n    return df\n\ndef preprocess_and_split(df: pd.DataFrame):\n    # Separate features and target\n    X = df.drop(columns=['y']).values\n    y = df['y'].values\n    \n    # Normalize features\n    scaler = StandardScaler()\n    X_scaled = scaler.fit_transform(X)\n\n    # Train-test split if necessary in preprocess_and_split\n    X_train, X_test, y_train, y_test = train_test_split(X_scaled, y, test_size=0.2, random_state=42)\n    \n    return X_train, X_test, y_train, y_test\n\ndef build_deep_learning_model(input_size: int, hidden_sizes: list):\n    # Define a simple feedforward neural network\n    class BeachProfileNet(nn.Module):\n        def __init__(self, input_size, hidden_sizes):\n            super(BeachProfileNet, self).__init__()\n            layers = []\n            last_size = input_size\n            for size in hidden_sizes:\n                layers.append(nn.Linear(last_size, size))\n                layers.append(nn.ReLU())\n                last_size = size\n            layers.append(nn.Linear(last_size, 1))  # output layer\n            self.network = nn.Sequential(*layers)\n        \n        def forward(self, x):\n            return self.network(x)\n    \n    # Create model\n    model = BeachProfileNet(input_size, hidden_sizes)\n    # Compile with MSE loss and Adam optimizer\n    optimizer = optim.Adam(model.parameters(), lr=0.001)\n    \n    return model, optimizer\n\ndef train_and_evaluate_model(model, optimizer, X_train, y_train, X_test, y_test):\n    # Convert data into PyTorch tensors\n    train_dataset = TensorDataset(torch.FloatTensor(X_train), torch.FloatTensor(y_train))\n    test_dataset = TensorDataset(torch.FloatTensor(X_test), torch.FloatTensor(y_test))\n\n    # Load data into DataLoaders\n    train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)\n    test_loader = DataLoader(test_dataset, batch_size=32, shuffle=False)\n\n    # Define loss function\n    criterion = nn.MSELoss()\n\n    # Train the model\n    for epoch in range(100):  # Train for 100 epochs\n        model.train()\n        for X_batch, y_batch in train_loader:\n            optimizer.zero_grad()\n            outputs = model(X_batch).squeeze()\n            loss = criterion(outputs, y_batch)\n            loss.backward()\n            optimizer.step()\n\n    # Evaluate the model\n    model.eval()\n    with torch.no_grad():\n        test_loss = 0\n        for X_batch, y_batch in test_loader:\n            outputs = model(X_batch).squeeze()\n            loss = criterion(outputs, y_batch)\n            test_loss += loss.item()\n\n    test_loss /= len(test_loader)\n    return test_loss\n\ndef main():\n    # File paths\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n\n    # Load and preprocess data\n    train_df, test_df = data_loader(train_path, test_path)\n    train_df = feature_engineering(train_df)\n    test_df = feature_engineering(test_df)\n\n    # Preprocess and split\n    X_train, X_test, y_train, y_test = preprocess_and_split(train_df)\n\n    # Build the model\n    input_size = X_train.shape[1]\n    hidden_sizes = [64, 32]  # Example hidden layer sizes\n    model, optimizer = build_deep_learning_model(input_size, hidden_sizes)\n\n    # Train and evaluate the model\n    test_loss = train_and_evaluate_model(model, optimizer, X_train, y_train, X_test, y_test)\n\n    return test_loss",
                "plan": "The code workflow is established to facilitate a seamless pipeline from data loading to model evaluation:\n\n1. **Data Loading**: The `data_loader` function imports data from specified Excel files, extracts relevant columns, and handles missing values by applying imputation strategies.\n\n2. **Feature Engineering**: The `feature_engineering` function transforms the dataset by encoding categorical variables like 'Dominant Wave Direction' using one-hot encoding. It also generates polynomial features from continuous variables such as 'x', helping model complex relationships.\n\n3. **Preprocessing and Splitting**: This function normalizes the data using `StandardScaler` and splits it into train-test datasets, maintaining a suitable dataset structure for input into a neural network.\n\n4. **Model Building**: The `build_deep_learning_model` function designs a deep learning model using PyTorch. It specifies a neural network with user-defined hidden layer sizes and configures it using the Adam optimizer and Mean Squared Error loss.\n\n5. **Model Training and Evaluation**: The `train_and_evaluate_model` function constructs PyTorch datasets and dataloaders to manage training loops. The model is trained through successive epochs and evaluated on test data to return the average Mean Squared Error, gauging predictive performance.\n\nThis comprehensive plan addresses each guideline and requirement to construct an effective deep learning model suitable for coastal data analysis.",
                "main_function_name": "main",
                "score": 0.833516895535649,
                "pass_rate": 1.0,
                "pass_rate_score": 1.0,
                "prediction_score": 0.0,
                "pylint_score": 0.614,
                "radon_score": 0.72116895535649,
                "test_case_results": {
                    "runnability_check": {
                        "success": true,
                        "reason": null,
                        "message": "code is runnable"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.07692307692307693
                }
            }
        }
    },
    {
        "0": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nfrom sklearn.compose import ColumnTransformer\nfrom sklearn.pipeline import Pipeline\nfrom torch import nn\nimport torch\nfrom torch.utils.data import DataLoader, TensorDataset\n\ndef load_and_preprocess_data():\n    # Load the datasets using pandas\n    train_data = pd.read_excel(\"beach_profile_data/processed_data/beachdata_train.xlsx\")\n    test_data = pd.read_excel(\"beach_profile_data/processed_data/beachdata_test.xlsx\")\n    \n    # Define relevant columns, including features and target\n    features = ['Annual Mean Period', 'Annual Mean Spring Tidal Range', \n                'Annual Mean Tidal Range', 'Breaker Wave Height Hb', \n                'Deep Water Wave Height Hd', 'Dimensionless Settling Velocity', \n                'High Tide Sediment Settling Velocity', 'Intertidal Slope', \n                'Kurtosis', 'Latitude', 'Longitude', 'Mean Grain Size', \n                'Mean Grain Size (Mz)', 'Mean Wave Height', 'Period', \n                'Profile Azimuth', 'Profile Length', 'Relative Tidal Range', \n                'Skewness', 'Sorting Coefficient', 'x']\n    \n    # Separate features and target variable\n    X_train = train_data[features]\n    y_train = train_data['y']\n    X_test = test_data[features]\n    y_test = test_data['y']\n    \n    # Preprocess the 'Dominant Wave Direction' feature (one-hot encoding)\n    preprocessor = ColumnTransformer(\n        transformers=[\n            ('num', StandardScaler(), features),\n            ('cat', OneHotEncoder(), ['Dominant Wave Direction'])\n        ])\n    \n    # Create the pipeline for preprocessing\n    X_train = preprocessor.fit_transform(train_data)\n    X_test = preprocessor.transform(test_data)\n    \n    return X_train, y_train, X_test, y_test\n\ndef apply_bruun_dean_models(dataframe):\n    # Bruun rule is generally linear, Dean model is power law (x^(2/3) relationship)\n    # Create initial predictions using the equations\n    dataframe['Bruun_Prediction'] = dataframe['x']  # Placeholder, usually needs a coefficient\n    dataframe['Dean_Prediction'] = dataframe['x'] ** (2 / 3)\n    return dataframe\n\ndef build_deep_learning_model(inputshape):\n    class SimpleMLP(nn.Module):\n        def __init__(self):\n            super(SimpleMLP, self).__init__()\n            self.fc1 = nn.Linear(inputshape, 64)\n            self.fc2 = nn.Linear(64, 32)\n            self.fc3 = nn.Linear(32, 1)\n            self.relu = nn.ReLU()\n        \n        def forward(self, x):\n            x = self.relu(self.fc1(x))\n            x = self.relu(self.fc2(x))\n            x = self.fc3(x)\n            return x\n    \n    model = SimpleMLP()\n    return model\n\ndef train_deep_learning_model(model, X_train, y_train):\n    # Prepare data loader for training\n    train_dataset = TensorDataset(torch.tensor(X_train, dtype=torch.float32), torch.tensor(y_train.values, dtype=torch.float32))\n    train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)\n    \n    # Initialize optimizer and loss function\n    criterion = nn.MSELoss()\n    optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n    \n    # Training loop\n    for epoch in range(100):  # Simple fixed number of epochs for illustration\n        for X_batch, y_batch in train_loader:\n            optimizer.zero_grad()\n            outputs = model(X_batch)\n            loss = criterion(outputs.flatten(), y_batch)\n            loss.backward()\n            optimizer.step()\n    \n    return model\n\ndef evaluate_deep_learning_model(model, X_test, y_test):\n    # Prepare data loader for testing\n    test_dataset = TensorDataset(torch.tensor(X_test, dtype=torch.float32), torch.tensor(y_test.values, dtype=torch.float32))\n    test_loader = DataLoader(test_dataset, batch_size=32, shuffle=False)\n    \n    # Set the model to evaluation mode\n    model.eval()\n    \n    # Initialize loss and performance metrics\n    criterion = nn.MSELoss()\n    total_loss = 0\n    \n    with torch.no_grad():\n        for X_batch, y_batch in test_loader:\n            outputs = model(X_batch)\n            loss = criterion(outputs.flatten(), y_batch)\n            total_loss += loss.item()\n    \n    average_loss = total_loss / len(test_loader)\n    results = {\n        \"Mean Squared Error\": average_loss,\n    }\n    return results\n\ndef main():\n    # Load and preprocess the data\n    X_train, y_train, X_test, y_test = load_and_preprocess_data()\n\n    # Load dataframe and apply the Bruun and Dean models\n    df_train = pd.DataFrame(X_train, columns=['x'] + list(range(X_train.shape[1] - 1)))\n    df_train = apply_bruun_dean_models(df_train)\n\n    # Build the deep learning model\n    model = build_deep_learning_model(X_train.shape[1])\n\n    # Train the model\n    trained_model = train_deep_learning_model(model, X_train, y_train)\n\n    # Evaluate the model\n    evaluation_results = evaluate_deep_learning_model(trained_model, X_test, y_test)\n\n    return evaluation_results",
                "plan": "1. **Load and Preprocess Data**: \n   - Utilize pandas to load the training and testing data from given paths.\n   - Select and process columns of interest including x, y, and categorical/numerical features.\n   - Preprocess features by scaling numerical columns and encoding 'Dominant Wave Direction'.\n\n2. **Apply Bruun and Dean Models**: \n   - Implement Bruun and Dean model equations to calculate initial predictions based on column 'x'.\n   - Attach prediction outputs as new columns in the dataset for comparison.\n\n3. **Build Deep Learning Model**: \n   - Construct a simple neural network using PyTorch with input features correlating to the preprocessed data.\n   - Design layers using common activation functions such as ReLU.\n\n4. **Train Deep Learning Model**: \n   - Prepare data for training, leveraging PyTorch data utilities for batching.\n   - Define optimizer and loss criteria, proceeding through iterative training over set epochs.\n\n5. **Evaluate Deep Learning Model**: \n   - Utilize the trained model on test data, gathering performance metrics.\n   - Return results like Mean Squared Error to quantify model accuracy and efficiency.\n\nEach component has distinct, logically ordered steps that guarantee proper data flow and functionality from loading data to final evaluation.",
                "main_function_name": "main",
                "score": 0.8147270026175669,
                "pass_rate": 1.0,
                "pass_rate_score": 1.0,
                "prediction_score": 0.0,
                "pylint_score": 0.446,
                "radon_score": 0.7012700261756699,
                "test_case_results": {
                    "runnability_check": {
                        "success": true,
                        "reason": null,
                        "message": "code is runnable"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.038461538461538464
                }
            }
        }
    },
    {
        "0": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nfrom torch.utils.data import DataLoader, TensorDataset\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nfrom sklearn.metrics import mean_squared_error, r2_score\nimport numpy as np\nimport matplotlib.pyplot as plt\n\n# Component: load_data\ndef load_data(train_path: str, test_path: str):\n    # Load the training and testing datasets into Pandas DataFrames\n    train_df = pd.read_excel(train_path)\n    test_df = pd.read_excel(test_path)\n\n    return train_df, test_df\n\n# Component: preprocess_data\ndef preprocess_data(train_df, test_df):\n    # Encode 'Dominant Wave Direction' using one-hot encoding\n    encoder = OneHotEncoder(sparse=False)\n    encoded_train = encoder.fit_transform(train_df[['Dominant Wave Direction']])\n    encoded_test = encoder.transform(test_df[['Dominant Wave Direction']])\n    \n    # Drop original categorical column and add the encoded columns\n    train_df = train_df.drop('Dominant Wave Direction', axis=1)\n    test_df = test_df.drop('Dominant Wave Direction', axis=1)\n\n    ohe_columns = encoder.get_feature_names_out(['Dominant Wave Direction'])\n    train_df[ohe_columns] = encoded_train\n    test_df[ohe_columns] = encoded_test\n\n    # Standardize numerical features\n    scaler = StandardScaler()\n\n    # Identify numerical columns\n    numerical_cols = train_df.select_dtypes(include=['float64', 'int64']).columns.tolist()\n    \n    # Do not scale target variable 'y'\n    numerical_cols.remove('y')\n    \n    train_df[numerical_cols] = scaler.fit_transform(train_df[numerical_cols])\n    test_df[numerical_cols] = scaler.transform(test_df[numerical_cols])\n\n    return train_df, test_df\n\n# Component: feature_engineering\ndef feature_engineering(df):\n    # Calculate interaction terms such as 'Breaker Wave Height Hb' * 'Period'\n    df['Breaker_Height_Period'] = df['Breaker Wave Height Hb'] * df['Period']\n    \n    # Add any other features from domain knowledge as required\n\n    return df\n\n# Component: build_deep_learning_model\nclass BeachProfileModel(nn.Module):\n    def __init__(self, input_dim):\n        super(BeachProfileModel, self).__init__()\n        self.model = nn.Sequential(\n            nn.Linear(input_dim, 64),\n            nn.ReLU(),\n            nn.Linear(64, 32),\n            nn.ReLU(),\n            nn.Linear(32, 1)\n        )\n\n    def forward(self, x):\n        return self.model(x)\n\ndef build_deep_learning_model(input_dim):\n    # Instantiate the model\n    model = BeachProfileModel(input_dim=input_dim)\n    return model\n\n# Component: train_model\ndef train_model(model, train_df, x_train_tensor, y_train_tensor):\n    # Create DataLoader for training\n    train_dataset = TensorDataset(x_train_tensor, y_train_tensor)\n    train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)\n    \n    # Define loss function and optimizer\n    criterion = nn.MSELoss()\n    optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n    \n    # Train the model\n    epochs = 100\n    for epoch in range(epochs):\n        for x_batch, y_batch in train_loader:\n            optimizer.zero_grad()\n            outputs = model(x_batch)\n            loss = criterion(outputs.flatten(), y_batch)\n            loss.backward()\n            optimizer.step()\n\n    return model\n\n# Component: evaluate_model\ndef evaluate_model(model, test_df, x_test_tensor, y_test_tensor):\n    # Create DataLoader for testing\n    test_dataset = TensorDataset(x_test_tensor, y_test_tensor)\n    test_loader = DataLoader(test_dataset, batch_size=32, shuffle=False)\n    \n    # Gather predictions and true labels\n    model.eval()  # Set model to evaluation mode\n    predictions = []\n    actuals = []\n\n    with torch.no_grad():\n        for x_batch, y_batch in test_loader:\n            outputs = model(x_batch)\n            predictions.extend(outputs.flatten().numpy())\n            actuals.extend(y_batch.numpy())\n    \n    # Calculate metrics\n    rmse = np.sqrt(mean_squared_error(actuals, predictions))\n    r2 = r2_score(actuals, predictions)\n    \n    # Optional: Create a plot comparing actual vs. predicted\n    plt.scatter(actuals, predictions)\n    plt.xlabel('Actual Elevation')\n    plt.ylabel('Predicted Elevation')\n    plt.title('Actual vs Predicted Elevation')\n    plt.show()\n\n    return rmse, {'r2_score': r2, 'rmse': rmse}\n\n# Main Function\ndef coastal_profile_analysis(train_path: str, test_path: str):\n    # Load data\n    train_df, test_df = load_data(train_path, test_path)\n    \n    # Preprocess data\n    train_df, test_df = preprocess_data(train_df, test_df)\n    \n    # Perform feature engineering\n    train_df = feature_engineering(train_df)\n    test_df = feature_engineering(test_df)\n    \n    # Separate features and target\n    x_train = train_df.drop(columns='y').values\n    y_train = train_df['y'].values\n    x_test = test_df.drop(columns='y').values\n    y_test = test_df['y'].values\n\n    # Convert to PyTorch tensors\n    x_train_tensor = torch.tensor(x_train, dtype=torch.float32)\n    y_train_tensor = torch.tensor(y_train, dtype=torch.float32)\n    x_test_tensor = torch.tensor(x_test, dtype=torch.float32)\n    y_test_tensor = torch.tensor(y_test, dtype=torch.float32)\n    \n    # Build and train deep learning model\n    model = build_deep_learning_model(input_dim=x_train.shape[1])\n    trained_model = train_model(model, train_df, x_train_tensor, y_train_tensor)\n    \n    # Evaluate model\n    evaluation_results = evaluate_model(trained_model, test_df, x_test_tensor, y_test_tensor)\n    \n    return evaluation_results",
                "plan": "1. **Data Loading:** The function `load_data` loads both training and testing datasets using pandas, which facilitates easy manipulation and preprocessing.\n\n2. **Data Preprocessing:** \n   - The `preprocess_data` function encodes categorical variables using OneHotEncoder, transforming these into a format suitable for model consumption.\n   - StandardScaler is used to normalize numerical features to ensure that each numerical feature contributes equally to the training process. The target variable `'y'` is excluded from scaling.\n\n3. **Feature Engineering:** \n   - The `feature_engineering` function introduces interaction terms (like between 'Breaker Wave Height Hb' and 'Period') which can capture complex relationships not directly observed in individual features, aligning closely with domain knowledge about coastal processes.\n\n4. **Model Design and Construction:** \n   - Using PyTorch, a custom neural network as defined in `BeachProfileModel` approximates the regression relationship between input features and elevation. This network is instantiated in `build_deep_learning_model`.\n   - The architecture consists of fully connected layers with ReLU activation, standard for capturing non-linear relationships.\n\n5. **Model Training:** \n   - `train_model` involves training the deep learning model over a number of epochs, utilizing PyTorch's DataLoader for batching and an optimizer like Adam which adapts the learning rate during training.\n\n6. **Model Evaluation:** \n   - The `evaluate_model` function measures the model's accuracy using RMSE and R², and compares predictions with actual values from the test set.\n   - Visual comparison through plots provides insights into how well the model performs against actual coastal profiles.\n\n7. **Main Workflow:** \n   - All components are integrated in `coastal_profile_analysis`, forming a coherent workflow from data reading and preprocessing to feature engineering, model training, and evaluation, with a focus on input/output consistency and clarity.",
                "main_function_name": "coastal_profile_analysis",
                "score": 0.1440976588722404,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.6519999999999999,
                "radon_score": 0.7889765887224043,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\nTypeError: coastal_profile_analysis() missing 2 required positional arguments: 'train_path' and 'test_path'\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.023668639053254437
                }
            }
        },
        "1": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nfrom torch.utils.data import DataLoader, TensorDataset\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nfrom sklearn.metrics import mean_squared_error, r2_score\nimport numpy as np\nimport matplotlib.pyplot as plt\n\n# Component: load_data\ndef load_data(train_path: str, test_path: str):\n    \"\"\"Load the training and testing datasets from specified paths.\"\"\"\n    train_df = pd.read_excel(train_path)\n    test_df = pd.read_excel(test_path)\n    return train_df, test_df\n\n# Component: preprocess_data\ndef preprocess_data(train_df, test_df):\n    \"\"\"Encode categorical variables and standardize numerical features.\"\"\"\n    # Encode 'Dominant Wave Direction' using one-hot encoding\n    encoder = OneHotEncoder(sparse=False)\n    encoded_train = encoder.fit_transform(train_df[['Dominant Wave Direction']])\n    encoded_test = encoder.transform(test_df[['Dominant Wave Direction']])\n    \n    # Drop original categorical column and add the encoded columns\n    train_df = train_df.drop('Dominant Wave Direction', axis=1)\n    test_df = test_df.drop('Dominant Wave Direction', axis=1)\n\n    ohe_columns = encoder.get_feature_names_out(['Dominant Wave Direction'])\n    train_df[ohe_columns] = encoded_train\n    test_df[ohe_columns] = encoded_test\n\n    # Standardize numerical features\n    scaler = StandardScaler()\n\n    # Identify numerical columns\n    numerical_cols = train_df.select_dtypes(include=['float64', 'int64']).columns.tolist()\n    \n    # Do not scale target variable 'y'\n    numerical_cols.remove('y')\n    \n    train_df[numerical_cols] = scaler.fit_transform(train_df[numerical_cols])\n    test_df[numerical_cols] = scaler.transform(test_df[numerical_cols])\n\n    return train_df, test_df\n\n# Component: feature_engineering\ndef feature_engineering(df):\n    \"\"\"Create new features based on domain knowledge.\"\"\"\n    df['Breaker_Height_Period'] = df['Breaker Wave Height Hb'] * df['Period']\n    return df\n\n# Component: build_deep_learning_model\nclass BeachProfileModel(nn.Module):\n    \"\"\"Deep Learning Model for Profile Prediction.\"\"\"\n    def __init__(self, input_dim):\n        super(BeachProfileModel, self).__init__()\n        self.model = nn.Sequential(\n            nn.Linear(input_dim, 64),\n            nn.ReLU(),\n            nn.Linear(64, 32),\n            nn.ReLU(),\n            nn.Linear(32, 1)\n        )\n\n    def forward(self, x):\n        return self.model(x)\n\ndef build_deep_learning_model(input_dim):\n    # Instantiate the model\n    return BeachProfileModel(input_dim=input_dim)\n\n# Component: train_model\ndef train_model(model, x_train_tensor, y_train_tensor):\n    \"\"\"Train the model using the training data tensors.\"\"\"\n    train_dataset = TensorDataset(x_train_tensor, y_train_tensor)\n    train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)\n    \n    criterion = nn.MSELoss()\n    optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n    \n    epochs = 100\n    for epoch in range(epochs):\n        for x_batch, y_batch in train_loader:\n            optimizer.zero_grad()\n            outputs = model(x_batch)\n            loss = criterion(outputs.flatten(), y_batch)\n            loss.backward()\n            optimizer.step()\n\n    return model\n\n# Component: evaluate_model\ndef evaluate_model(model, x_test_tensor, y_test_tensor):\n    \"\"\"Evaluate the model using the test data tensors.\"\"\"\n    test_dataset = TensorDataset(x_test_tensor, y_test_tensor)\n    test_loader = DataLoader(test_dataset, batch_size=32, shuffle=False)\n    \n    model.eval()  # Set model to evaluation mode\n    predictions = []\n    actuals = []\n\n    with torch.no_grad():\n        for x_batch, y_batch in test_loader:\n            outputs = model(x_batch)\n            predictions.extend(outputs.flatten().numpy())\n            actuals.extend(y_batch.numpy())\n    \n    rmse = np.sqrt(mean_squared_error(actuals, predictions))\n    r2 = r2_score(actuals, predictions)\n    \n    plt.scatter(actuals, predictions)\n    plt.xlabel('Actual Elevation')\n    plt.ylabel('Predicted Elevation')\n    plt.title('Actual vs Predicted Elevation')\n    plt.show()\n\n    return rmse, {'r2_score': r2, 'rmse': rmse}\n\n# Main Function\ndef main():\n    \"\"\"Main function to execute the data processing and model analysis.\"\"\"\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n    \n    train_df, test_df = load_data(train_path, test_path)\n    train_df, test_df = preprocess_data(train_df, test_df)\n    \n    train_df = feature_engineering(train_df)\n    test_df = feature_engineering(test_df)\n    \n    x_train = train_df.drop(columns='y').values\n    y_train = train_df['y'].values\n    x_test = test_df.drop(columns='y').values\n    y_test = test_df['y'].values\n\n    x_train_tensor = torch.tensor(x_train, dtype=torch.float32)\n    y_train_tensor = torch.tensor(y_train, dtype=torch.float32)\n    x_test_tensor = torch.tensor(x_test, dtype=torch.float32)\n    y_test_tensor = torch.tensor(y_test, dtype=torch.float32)\n    \n    model = build_deep_learning_model(input_dim=x_train.shape[1])\n    trained_model = train_model(model, x_train_tensor, y_train_tensor)\n    \n    evaluation_results = evaluate_model(trained_model, x_test_tensor, y_test_tensor)\n    return evaluation_results",
                "plan": "1. **Data Loading**: Read the train and test datasets from specified Excel file paths into Pandas DataFrames.\n\n2. **Preprocessing**: \n   - Encode categorical variables ('Dominant Wave Direction') using one-hot encoding.\n   - Standardize numeric features except for the target variable 'y' to ensure all features are on a similar scale.\n\n3. **Feature Engineering**: \n   - Enhance the dataset by engineering new features such as interactions between existing features to better capture underlying relationships.\n\n4. **Model Definition**: \n   - Define a neural network (NN) structure using PyTorch with layers appropriate for a regression task predicting elevation.\n\n5. **Training the Model**:\n   - Train the defined NN model using the processed training dataset, leveraging an optimizer and loss function suitable for regression.\n\n6. **Evaluating the Model**:\n   - Evaluate the trained model's predictive performance using test data by computing metrics like RMSE and R-squared.\n   - Visualize results through a scatter plot to compare actual vs. predicted values of elevation.\n\n7. **Execution via Main Function**:\n   - Integrate all steps in a self-contained `main()` function, ensuring no external input is needed, following the call of each component sequentially.",
                "main_function_name": "main",
                "score": 0.8496121594267091,
                "pass_rate": 1.0,
                "pass_rate_score": 1.0,
                "prediction_score": 0.0,
                "pylint_score": 0.778,
                "radon_score": 0.7181215942670918,
                "test_case_results": {
                    "runnability_check": {
                        "success": true,
                        "reason": null,
                        "message": "code is runnable"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.023668639053254437
                }
            }
        }
    },
    {
        "0": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nfrom sklearn.model_selection import train_test_split, GridSearchCV\nfrom sklearn.neural_network import MLPRegressor\nfrom sklearn.metrics import mean_squared_error, mean_absolute_error\nfrom sklearn.pipeline import Pipeline\nfrom sklearn.compose import ColumnTransformer\n\ndef data_loader(train_path: str, test_path: str):\n    # Load training and testing data from Excel files\n    train_data = pd.read_excel(train_path)\n    test_data = pd.read_excel(test_path)\n    return train_data, test_data\n\ndef feature_engineering(data: pd.DataFrame):\n    # Separate features and target\n    X = data.drop(columns=['y'])\n    y = data['y']\n\n    # Encoding the 'Dominant Wave Direction' categorical feature using one-hot encoding\n    categorical_features = ['Dominant Wave Direction']\n    numerical_features = X.columns.difference(categorical_features)\n\n    # Building transformations for numerical and categorical features\n    numerical_transformer = StandardScaler()\n    categorical_transformer = OneHotEncoder(handle_unknown='ignore')\n\n    # Column transformer for applying transformations\n    preprocessor = ColumnTransformer(\n        transformers=[\n            ('num', numerical_transformer, numerical_features),\n            ('cat', categorical_transformer, categorical_features)\n        ]\n    )\n\n    # Apply transformations to the data\n    X = preprocessor.fit_transform(X)\n    \n    return X, y\n\ndef mathematical_model(data: pd.DataFrame):\n    # Applying Bruun Rule and Dean's Model to estimate sea level change\n    B = 1  # Placeholder for beach width, should be set based on domain knowledge\n    h = 1  # Placeholder for average sediment transport depth, should be set based on domain knowledge\n    A = 1  # Placeholder for Dean's scaling parameter\n    \n    # Calculate shoreline retreat and depth following Bruun and Dean's Models\n    shoreline_retreat = data['x'] / (B + h)  # Simplified example, replace with actual computation needed\n    beach_depth = A * np.power(data['x'], 2/3)\n\n    # Aggregate results to form a combined prediction\n    predictions = shoreline_retreat + beach_depth  # Simplified example\n    return predictions\n\ndef deep_learning_model(X_train, y_train):\n    # Define a simple MLP regressor model and set grid for hyperparameter search\n    model = MLPRegressor(random_state=42, max_iter=500)\n    param_grid = {\n        'hidden_layer_sizes': [(50, 50), (100,)],\n        'alpha': [0.0001, 0.001, 0.01],\n        'learning_rate_init': [0.001, 0.01]\n    }\n\n    # Using GridSearchCV to find the best model configuration\n    grid_search = GridSearchCV(model, param_grid, cv=5, scoring='neg_mean_squared_error', n_jobs=-1)\n    grid_search.fit(X_train, y_train)\n\n    return grid_search\n\ndef evaluation_and_prediction(trained_model, X_test, y_test):\n    # Use the trained model to make predictions on test data\n    predictions = trained_model.predict(X_test)\n\n    # Evaluate model performance using metrics\n    rmse = np.sqrt(mean_squared_error(y_test, predictions))\n    mae = mean_absolute_error(y_test, predictions)\n\n    print(f\"RMSE: {rmse}, MAE: {mae}\")\n\n    return predictions\n\ndef main():\n    # File paths for training and test data\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n\n    # Step 1: Load data\n    train_data, test_data = data_loader(train_path, test_path)\n\n    # Step 2: Feature engineering on training data\n    X_train, y_train = feature_engineering(train_data)\n\n    # Step 3: Applying mathematical model - this can provide baseline predictions/insights\n    baseline_predictions = mathematical_model(train_data)\n\n    # Step 4: Building and training deep learning model\n    trained_model = deep_learning_model(X_train, y_train)\n\n    # Step 5: Feature engineering on test data\n    X_test, y_test = feature_engineering(test_data)\n\n    # Step 6: Evaluation and prediction on test data\n    predictions = evaluation_and_prediction(trained_model, X_test, y_test)\n\n    return predictions",
                "plan": "The code is structured to sequentially execute multiple tasks essential for modeling sea level change based on the Bruun and Dean models knowledge, and employing a deep learning approach to improve predictions.\n\n1. **Data Loading**: Uses pandas to load datasets from Excel files into DataFrames for manipulation.\n\n2. **Feature Engineering**: \n   - Encodes the categorical feature \"Dominant Wave Direction\" using OneHotEncoder.\n   - Scales numerical columns for uniform reference points using StandardScaler.\n   - Applies these transformations to both training and test datasets.\n\n3. **Mathematical Modeling**:\n   - Implements basic calculations using the principles from the Bruun and Dean models to create baseline predictions based solely on inputs such as 'x'.\n\n4. **Deep Learning Model**: \n   - Constructs a Multi-Layer Perceptron regressor and optimizes it using GridSearchCV for hyperparameter tuning.\n   - Uses a cross-validation approach for robust estimation of the best model.\n\n5. **Evaluation and Prediction**:\n   - Evaluates the trained model's performance through RMSE and MAE on the test dataset.\n   - Outputs these metrics and predictions to compare against baseline and understand model efficacy.\n\nThe main function orchestrates these steps, handling data paths defined as specified, without requiring any external input.",
                "main_function_name": "main",
                "score": 0.1336642355387246,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.558,
                "radon_score": 0.778642355387246,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "timeout",
                        "message": "Process did not finish within the allowed time"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.007100591715976331
                }
            }
        },
        "1": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nfrom sklearn.model_selection import train_test_split\nfrom sklearn.neural_network import MLPRegressor\nfrom sklearn.metrics import mean_squared_error, mean_absolute_error\nfrom sklearn.pipeline import Pipeline\nfrom sklearn.compose import ColumnTransformer\n\ndef data_loader(train_path: str, test_path: str):\n    \"\"\"Loads training and testing data from Excel files.\"\"\"\n    train_data = pd.read_excel(train_path)\n    test_data = pd.read_excel(test_path)\n    return train_data, test_data\n\ndef feature_engineering(data: pd.DataFrame):\n    \"\"\"Performs feature engineering, including encoding of categorical variables.\"\"\"\n    X = data.drop(columns=['y'])\n    y = data['y']\n\n    # Encoding the 'Dominant Wave Direction' categorical feature using one-hot encoding\n    categorical_features = ['Dominant Wave Direction']\n    numerical_features = X.columns.difference(categorical_features)\n\n    # Building transformations for numerical and categorical features\n    numerical_transformer = StandardScaler()\n    categorical_transformer = OneHotEncoder(handle_unknown='ignore')\n\n    # Column transformer for applying transformations\n    preprocessor = ColumnTransformer(\n        transformers=[\n            ('num', numerical_transformer, numerical_features),\n            ('cat', categorical_transformer, categorical_features)\n        ]\n    )\n\n    # Apply transformations to the data\n    X = preprocessor.fit_transform(X)\n    \n    return X, y\n\ndef mathematical_model(data: pd.DataFrame):\n    \"\"\"Applies the Bruun and Dean models to estimate sea level change.\"\"\"\n    B = 1  # Example placeholder\n    h = 1  # Example placeholder\n    A = 1  # Example placeholder\n    \n    # Implementing simplified versions of Bruun and Dean's Models\n    shoreline_retreat = data['x'] / (B + h)  # Example computation\n    beach_depth = A * np.power(data['x'], 2/3)\n\n    # Aggregate results to form a combined prediction\n    predictions = shoreline_retreat + beach_depth\n    return predictions\n\ndef deep_learning_model(X_train, y_train):\n    \"\"\"Builds and trains an MLPRegressor as a deep learning model.\"\"\"\n    # Define a simple MLP regressor model\n    model = MLPRegressor(hidden_layer_sizes=(50, 50), max_iter=300, random_state=42)\n\n    # Fit the model without grid search to save time\n    model.fit(X_train, y_train)\n\n    return model\n\ndef evaluation_and_prediction(trained_model, X_test, y_test):\n    \"\"\"Evaluates model performance and predicts the test dataset.\"\"\"\n    predictions = trained_model.predict(X_test)\n\n    # Evaluate model performance using metrics\n    rmse = np.sqrt(mean_squared_error(y_test, predictions))\n    mae = mean_absolute_error(y_test, predictions)\n\n    print(f\"RMSE: {rmse}, MAE: {mae}\")\n\n    return predictions\n\ndef main():\n    # File paths for training and test data\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n\n    # Step 1: Load data\n    train_data, test_data = data_loader(train_path, test_path)\n\n    # Step 2: Feature engineering on training data\n    X_train, y_train = feature_engineering(train_data)\n\n    # Step 3: Applying mathematical model\n    baseline_predictions = mathematical_model(train_data)\n\n    # Step 4: Building and training deep learning model\n    trained_model = deep_learning_model(X_train, y_train)\n\n    # Step 5: Feature engineering on test data\n    X_test, y_test = feature_engineering(test_data)\n\n    # Step 6: Evaluate and predict on test data\n    predictions = evaluation_and_prediction(trained_model, X_test, y_test)\n\n    return predictions",
                "plan": "1. **Data Loading**: \n   - Utilize `pandas` to load train and test datasets from Excel files. Ensure the paths are correctly pointing to the specified file locations.\n   \n2. **Feature Engineering**:\n   - Drop the target column `y` from the dataset to prepare feature data `X`.\n   - Encode categorical feature `Dominant Wave Direction` using one-hot encoding for proper handling by neural networks.\n   - Standardize numerical features to ensure equal treatment in the model.\n\n3. **Mathematical Model**:\n   - Implement simplified Bruun and Dean models to estimate changes in sea level.\n   - Calculate predictions for shoreline retreat and depth for baseline understanding.\n\n4. **Deep Learning Model**:\n   - Create a Multi-Layer Perceptron (MLP) Regressor without hyperparameter grid search to streamline execution.\n   - Train on the engineered features using the `fit` method.\n\n5. **Evaluation and Prediction**:\n   - Use the trained model to predict on test data.\n   - Evaluate predictions via RMSE and MAE metrics to gain performance insights.\n\n6. **Integration and Execution**:\n   - The `main()` function integrates all components ensuring a cohesive workflow from data loading to model evaluation.",
                "main_function_name": "main",
                "score": 0.14543093545400454,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.6799999999999999,
                "radon_score": 0.7743093545400456,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 99, in main\n  File \"<string>\", line 68, in evaluation_and_prediction\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\sklearn\\neural_network\\_multilayer_perceptron.py\", line 1599, in predict\n    return self._predict(X)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\sklearn\\neural_network\\_multilayer_perceptron.py\", line 1603, in _predict\n    y_pred = self._forward_pass_fast(X, check_input=check_input)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\sklearn\\neural_network\\_multilayer_perceptron.py\", line 207, in _forward_pass_fast\n    X = self._validate_data(X, accept_sparse=[\"csr\", \"csc\"], reset=False)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\sklearn\\base.py\", line 626, in _validate_data\n    self._check_n_features(X, reset=reset)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\sklearn\\base.py\", line 415, in _check_n_features\n    raise ValueError(\nValueError: X has 27 features, but MLPRegressor is expecting 28 features as input.\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.00109239872553482
                }
            }
        },
        "2": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nfrom sklearn.model_selection import train_test_split\nfrom sklearn.neural_network import MLPRegressor\nfrom sklearn.metrics import mean_squared_error, mean_absolute_error\nfrom sklearn.pipeline import Pipeline\nfrom sklearn.compose import ColumnTransformer\n\ndef data_loader(train_path: str, test_path: str):\n    \"\"\"Loads training and testing data from Excel files.\"\"\"\n    train_data = pd.read_excel(train_path)\n    test_data = pd.read_excel(test_path)\n    return train_data, test_data\n\ndef feature_engineering(train_data: pd.DataFrame, test_data: pd.DataFrame):\n    \"\"\"Performs feature engineering, including encoding of categorical variables.\"\"\"\n    X_train = train_data.drop(columns=['y'])\n    y_train = train_data['y']\n    X_test = test_data.drop(columns=['y'])\n    y_test = test_data['y']\n\n    # Define categorical and numerical columns\n    categorical_features = ['Dominant Wave Direction']\n    numerical_features = X_train.columns.difference(categorical_features)\n\n    # Define transformers for preprocessing\n    numerical_transformer = StandardScaler()\n    categorical_transformer = OneHotEncoder(handle_unknown='ignore')\n\n    # Define column transformer\n    preprocessor = ColumnTransformer(\n        transformers=[\n            ('num', numerical_transformer, numerical_features),\n            ('cat', categorical_transformer, categorical_features)\n        ]\n    )\n\n    # Fit only on the training data and transform both\n    X_train_transformed = preprocessor.fit_transform(X_train)\n    X_test_transformed = preprocessor.transform(X_test)\n    \n    return X_train_transformed, y_train, X_test_transformed, y_test\n\ndef mathematical_model(data: pd.DataFrame):\n    \"\"\"Applies the Bruun and Dean models to estimate sea level change.\"\"\"\n    B = 1  # Placeholder\n    h = 1  # Placeholder\n    A = 1  # Placeholder\n    \n    # Implementing simplified versions of Bruun and Dean's Models\n    shoreline_retreat = data['x'] / (B + h)  # Example computation\n    beach_depth = A * np.power(data['x'], 2/3)\n\n    # Aggregate results to form a combined prediction\n    predictions = shoreline_retreat + beach_depth\n    return predictions\n\ndef deep_learning_model(X_train, y_train):\n    \"\"\"Builds and trains an MLPRegressor as a deep learning model.\"\"\"\n    # Define a simple MLP regressor model\n    model = MLPRegressor(hidden_layer_sizes=(50, 50), max_iter=300, random_state=42)\n\n    # Fit the model\n    model.fit(X_train, y_train)\n\n    return model\n\ndef evaluation_and_prediction(trained_model, X_test, y_test):\n    \"\"\"Evaluates model performance and predicts the test dataset.\"\"\"\n    predictions = trained_model.predict(X_test)\n\n    # Evaluate model performance using metrics\n    rmse = np.sqrt(mean_squared_error(y_test, predictions))\n    mae = mean_absolute_error(y_test, predictions)\n\n    print(f\"RMSE: {rmse}, MAE: {mae}\")\n\n    return predictions\n\ndef main():\n    # File paths for training and test data\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n\n    # Step 1: Load data\n    train_data, test_data = data_loader(train_path, test_path)\n\n    # Step 2: Feature engineering to ensure consistent feature space\n    X_train, y_train, X_test, y_test = feature_engineering(train_data, test_data)\n\n    # Step 3: Optionally apply the mathematical model for initial insights\n    baseline_predictions = mathematical_model(train_data)\n\n    # Step 4: Build and train the deep learning model\n    trained_model = deep_learning_model(X_train, y_train)\n\n    # Step 5: Evaluate and predict on test data\n    predictions = evaluation_and_prediction(trained_model, X_test, y_test)\n\n    return predictions",
                "plan": "1. **Data Loading**:\n   - Define a function `data_loader()` to load data from specified Excel files for both training and testing datasets.\n\n2. **Feature Engineering**:\n   - Define `feature_engineering()` to handle feature preprocessing such as scaling numeric values and one-hot encoding categorical features.\n   - Ensure the column transformer is fit on training data only and then transform both training and test data to maintain consistency in features.\n\n3. **Mathematical Modeling**:\n   - Implement `mathematical_model()` to apply simplified Bruun and Dean models for rough predictions based on domain knowledge.\n\n4. **Deep Learning Model**:\n   - Define `deep_learning_model()` to build, train, and return an `MLPRegressor` used as a neural network.\n\n5. **Model Evaluation**:\n   - Define `evaluation_and_prediction()` to evaluate model predictions using RMSE and MAE.\n\n6. **Main Function**:\n   - Integrate all components in `main()` function, ensuring all workflows are connected, and evaluate performance.",
                "main_function_name": "main",
                "score": 0.8419623605533706,
                "pass_rate": 1.0,
                "pass_rate_score": 1.0,
                "prediction_score": 0.0,
                "pylint_score": 0.654,
                "radon_score": 0.7656236055337062,
                "test_case_results": {
                    "runnability_check": {
                        "success": true,
                        "reason": null,
                        "message": "code is runnable"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.00109239872553482
                }
            }
        }
    },
    {
        "0": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nimport torch\nfrom torch import nn, optim\nfrom sklearn.preprocessing import OneHotEncoder, StandardScaler\nfrom sklearn.metrics import mean_squared_error\nfrom torch.utils.data import DataLoader, TensorDataset\n\n# Load data component\ndef load_data(training_file_path: str, test_file_path: str):\n    # Read data from the Excel files\n    train_data = pd.read_excel(training_file_path)\n    test_data = pd.read_excel(test_file_path)\n    return train_data, test_data\n\n# Preprocess data component\ndef preprocess_data(data: pd.DataFrame):\n    # Identify and isolate the categorical column 'Dominant Wave Direction'\n    encoder = OneHotEncoder(sparse=False)\n    encoded_wave_direction = encoder.fit_transform(data[['Dominant Wave Direction']])\n    \n    # Remove the original categorical column and replace it with the encoded columns\n    data = data.drop('Dominant Wave Direction', axis=1)\n    encoded_columns = pd.DataFrame(encoded_wave_direction, index=data.index, columns=encoder.get_feature_names_out())\n    data = pd.concat([data, encoded_columns], axis=1)\n    \n    # Normalize numerical features using standard scaling\n    scaler = StandardScaler()\n    numerical_features = data.drop(['y'], axis=1)  # Exclude target variable 'y' from normalization\n    scaled_features = scaler.fit_transform(numerical_features)\n    \n    # Combine scaled features with target variable\n    processed_data = pd.DataFrame(scaled_features, columns=numerical_features.columns)\n    processed_data['y'] = data['y'].values\n    return processed_data\n\n# Calculate Bruun Retraction\ndef calculate_bruun_retraction(sea_level_rise: float, cross_shore_distance: float, closure_depth: float, active_profile_height: float):\n    # Compute shoreline retraction using Bruun equation\n    R = (sea_level_rise * cross_shore_distance) / (closure_depth + active_profile_height)\n    return R\n\n# Calculate Dean Profile\ndef calculate_dean_profile(distance: float, scale_parameter: float):\n    # Compute beach profile elevation using Dean profile\n    elevation = scale_parameter * distance**(2/3)\n    return elevation\n\n# Build deep learning model component\ndef build_deep_learning_model(input_dim: int, output_dim: int):\n    # Define a simple feed-forward neural network model using PyTorch\n    class BeachProfileNet(nn.Module):\n        def __init__(self):\n            super(BeachProfileNet, self).__init__()\n            self.layer1 = nn.Linear(input_dim, 64)\n            self.layer2 = nn.Linear(64, 32)\n            self.layer3 = nn.Linear(32, output_dim)\n            self.relu = nn.ReLU()\n\n        def forward(self, x):\n            x = self.relu(self.layer1(x))\n            x = self.relu(self.layer2(x))\n            x = self.layer3(x)\n            return x\n    \n    model = BeachProfileNet()\n    return model\n\n# Train and evaluate model component\ndef train_and_evaluate_model(model: nn.Module, training_data: pd.DataFrame, testing_data: pd.DataFrame, epochs: int, learning_rate: float):\n    # Prepare data loaders\n    X_train = torch.tensor(training_data.drop('y', axis=1).values, dtype=torch.float32)\n    y_train = torch.tensor(training_data['y'].values, dtype=torch.float32).view(-1, 1)\n    \n    X_test = torch.tensor(testing_data.drop('y', axis=1).values, dtype=torch.float32)\n    y_test = torch.tensor(testing_data['y'].values, dtype=torch.float32).view(-1, 1)\n    \n    train_dataset = TensorDataset(X_train, y_train)\n    train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)\n    \n    # Define loss function and optimizer\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=learning_rate)\n    \n    # Training loop\n    for epoch in range(epochs):\n        model.train()\n        for X_batch, y_batch in train_loader:\n            optimizer.zero_grad()\n            predictions = model(X_batch)\n            loss = criterion(predictions, y_batch)\n            loss.backward()\n            optimizer.step()\n    \n    # Evaluation\n    model.eval()\n    with torch.no_grad():\n        predictions = model(X_test)\n        test_loss = mean_squared_error(y_test, predictions)\n    \n    # Return evaluation metrics\n    return {\"mean_squared_error\": test_loss}\n\n# Main function integrating all components\ndef main(training_file_path: str, test_file_path: str):\n    # Step 1: Load data\n    train_data, test_data = load_data(training_file_path, test_file_path)\n    \n    # Step 2: Preprocess data\n    processed_train_data = preprocess_data(train_data)\n    processed_test_data = preprocess_data(test_data)\n    \n    # Step 3: Initialize model\n    input_dimensions = processed_train_data.shape[1] - 1  # subtract 1 for target variable\n    output_dimensions = 1\n    model = build_deep_learning_model(input_dimensions, output_dimensions)\n    \n    # Step 4: Train and Evaluate model\n    results = train_and_evaluate_model(model, processed_train_data, processed_test_data, epochs=10, learning_rate=0.001)\n    \n    # Return results\n    return results",
                "plan": "The code integrates several steps to handle the training and evaluation of a deep learning model for beach profile data. Here's a detailed breakdown:\n\n1. **Loading Data**: \n   - The `load_data` function reads training and test datasets from Excel files and returns them as pandas DataFrames.\n   \n2. **Preprocessing Data**:\n   - The `preprocess_data` function encodes the 'Dominant Wave Direction' categorical feature using one-hot encoding and scales numerical features using standard scaling, excluding the target variable 'y'.\n   \n3. **Bruun and Dean Calculations**:\n   - `calculate_bruun_retraction` applies the Bruun model equation to calculate shoreline retraction as per the specified parameters.\n   - `calculate_dean_profile` calculates beach profile elevation using the Dean model equation for provided parameters.\n   \n4. **Building the Model**:\n   - The `build_deep_learning_model` defines a PyTorch model class `BeachProfileNet`. The model consists of fully connected layers with ReLU activations for non-linear transformation.\n   \n5. **Training and Evaluation**:\n   - The `train_and_evaluate_model` function uses the given model along with training and test datasets. It sets up data loaders, defines the loss function, and uses an optimizer to train the model over several epochs. The evaluation is performed using mean-squared error to assess the model’s performance on the test dataset.\n   \n6. **Integration**:\n   - Finally, the `main` function integrates all steps by loading the data, preprocessing, initializing the model, and training & evaluating the model, returning the evaluation results.\n\nThis step-by-step organization ensures all necessary components are implemented and used correctly within the entire process flow, maintaining clarity and functionality in the code.",
                "main_function_name": "main",
                "score": 0.12126514252858656,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.493,
                "radon_score": 0.7196514252858655,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\nTypeError: main() missing 2 required positional arguments: 'training_file_path' and 'test_file_path'\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.007100591715976331
                }
            }
        },
        "1": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nimport torch\nfrom torch import nn, optim\nfrom sklearn.preprocessing import OneHotEncoder, StandardScaler\nfrom sklearn.metrics import mean_squared_error\nfrom torch.utils.data import DataLoader, TensorDataset\n\n# Load data component\ndef load_data():\n    training_file_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_file_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n    \n    # Read data from the Excel files\n    train_data = pd.read_excel(training_file_path)\n    test_data = pd.read_excel(test_file_path)\n    return train_data, test_data\n\n# Preprocess data component\ndef preprocess_data(data: pd.DataFrame):\n    # Identify and isolate the categorical column 'Dominant Wave Direction'\n    encoder = OneHotEncoder(sparse_output=False)\n    encoded_wave_direction = encoder.fit_transform(data[['Dominant Wave Direction']])\n    \n    # Remove the original categorical column and replace it with the encoded columns\n    data = data.drop('Dominant Wave Direction', axis=1)\n    encoded_columns = pd.DataFrame(encoded_wave_direction, index=data.index, columns=encoder.get_feature_names_out())\n    data = pd.concat([data, encoded_columns], axis=1)\n    \n    # Normalize numerical features using standard scaling\n    scaler = StandardScaler()\n    numerical_features = data.drop(['y'], axis=1)  # Exclude target variable 'y' from normalization\n    scaled_features = scaler.fit_transform(numerical_features)\n    \n    # Combine scaled features with target variable\n    processed_data = pd.DataFrame(scaled_features, columns=numerical_features.columns)\n    processed_data['y'] = data['y'].values\n    return processed_data\n\n# Calculate Bruun Retraction\ndef calculate_bruun_retraction(sea_level_rise: float, cross_shore_distance: float, closure_depth: float, active_profile_height: float):\n    # Compute shoreline retraction using the Bruun equation\n    R = (sea_level_rise * cross_shore_distance) / (closure_depth + active_profile_height)\n    return R\n\n# Calculate Dean Profile\ndef calculate_dean_profile(distance: float, scale_parameter: float):\n    # Compute beach profile elevation using the Dean profile\n    elevation = scale_parameter * distance**(2/3)\n    return elevation\n\n# Build deep learning model component\ndef build_deep_learning_model(input_dim: int, output_dim: int):\n    # Define a simple feed-forward neural network model using PyTorch\n    class BeachProfileNet(nn.Module):\n        def __init__(self):\n            super(BeachProfileNet, self).__init__()\n            self.layer1 = nn.Linear(input_dim, 64)\n            self.layer2 = nn.Linear(64, 32)\n            self.layer3 = nn.Linear(32, output_dim)\n            self.relu = nn.ReLU()\n\n        def forward(self, x):\n            x = self.relu(self.layer1(x))\n            x = self.relu(self.layer2(x))\n            x = self.layer3(x)\n            return x\n    \n    model = BeachProfileNet()\n    return model\n\n# Train and evaluate model component\ndef train_and_evaluate_model(model: nn.Module, training_data: pd.DataFrame, testing_data: pd.DataFrame, epochs: int, learning_rate: float):\n    # Prepare data loaders\n    X_train = torch.tensor(training_data.drop('y', axis=1).values, dtype=torch.float32)\n    y_train = torch.tensor(training_data['y'].values, dtype=torch.float32).view(-1, 1)\n    \n    X_test = torch.tensor(testing_data.drop('y', axis=1).values, dtype=torch.float32)\n    y_test = torch.tensor(testing_data['y'].values, dtype=torch.float32).view(-1, 1)\n    \n    train_dataset = TensorDataset(X_train, y_train)\n    train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)\n    \n    # Define loss function and optimizer\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=learning_rate)\n    \n    # Training loop\n    for epoch in range(epochs):\n        model.train()\n        for X_batch, y_batch in train_loader:\n            optimizer.zero_grad()\n            predictions = model(X_batch)\n            loss = criterion(predictions, y_batch)\n            loss.backward()\n            optimizer.step()\n    \n    # Evaluation\n    model.eval()\n    with torch.no_grad():\n        predictions = model(X_test)\n        test_loss = mean_squared_error(y_test, predictions.numpy())\n    \n    # Return evaluation metrics\n    return {\"mean_squared_error\": test_loss}\n\n# Main function integrating all components\ndef main():\n    # Step 1: Load data\n    train_data, test_data = load_data()\n    \n    # Step 2: Preprocess data\n    processed_train_data = preprocess_data(train_data)\n    processed_test_data = preprocess_data(test_data)\n    \n    # Step 3: Initialize model\n    input_dimensions = processed_train_data.shape[1] - 1  # subtract 1 for target variable\n    output_dimensions = 1\n    model = build_deep_learning_model(input_dimensions, output_dimensions)\n    \n    # Step 4: Train and Evaluate model\n    results = train_and_evaluate_model(model, processed_train_data, processed_test_data, epochs=10, learning_rate=0.001)\n    \n    # Return results\n    return results",
                "plan": "1. **Load Data**: Use `pandas` to load the training and test datasets from predefined file paths. This provides a foundation to work with for both the input features and the target variable.\n\n2. **Preprocess Data**: Convert categorical columns like \"Dominant Wave Direction\" to numerical form using one-hot encoding, allowing them to be processed by machine learning algorithms. Then, scale numerical features to give them similar ranges, which can improve model training.\n\n3. **Calculate Bruun Retraction (optional feature)**: Define a method to compute shoreline retraction using the Bruun rule. This was part of the user guidance but isn't directly used in model training or prediction.\n\n4. **Calculate Dean Profile (optional feature)**: Similarly, define a method to compute the Dean profile. Like the Bruun Retraction, it's part of the theoretical framework but isn't directly used in the model.\n\n5. **Build Deep Learning Model**: Define a simple feed-forward neural network using PyTorch to predict the target variable `y`. The network architecture includes fully connected layers with ReLU activations.\n\n6. **Train and Evaluate Model**: Use the preprocessed data to train this model. Perform evaluation to calculate metrics such as mean squared error on the test data to quantify the model's accuracy.\n\n7. **Main Function**: The function `main()` orchestrates these steps: it loads data, preprocesses it, initializes the model, trains it, evaluates it, and returns the performance metrics. This integrated logic allows execution without input arguments.",
                "main_function_name": "main",
                "score": 0.12096252217320436,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.49400000000000005,
                "radon_score": 0.7156252217320436,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 122, in main\n  File \"<string>\", line 101, in train_and_evaluate_model\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"<string>\", line 64, in forward\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\linear.py\", line 116, in forward\n    return F.linear(input, self.weight, self.bias)\nRuntimeError: mat1 and mat2 shapes cannot be multiplied (242x27 and 28x64)\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        },
        "2": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nimport torch\nfrom torch import nn, optim\nfrom sklearn.preprocessing import OneHotEncoder, StandardScaler\nfrom sklearn.metrics import mean_squared_error\nfrom torch.utils.data import DataLoader, TensorDataset\n\n# Load data component\ndef load_data():\n    training_file_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_file_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n    \n    # Read data from the Excel files\n    train_data = pd.read_excel(training_file_path)\n    test_data = pd.read_excel(test_file_path)\n    return train_data, test_data\n\n# Preprocess data component\ndef preprocess_data(data: pd.DataFrame):\n    # Identify and isolate the categorical column 'Dominant Wave Direction'\n    encoder = OneHotEncoder(sparse_output=False)\n    encoded_wave_direction = encoder.fit_transform(data[['Dominant Wave Direction']])\n    \n    # Remove the original categorical column and replace it with the encoded columns\n    data = data.drop('Dominant Wave Direction', axis=1)\n    encoded_columns = pd.DataFrame(encoded_wave_direction, index=data.index, columns=encoder.get_feature_names_out())\n    data = pd.concat([data, encoded_columns], axis=1)\n    \n    # Normalize numerical features using standard scaling\n    scaler = StandardScaler()\n    numerical_features = data.drop(['y'], axis=1)  # Exclude target variable 'y' from normalization\n    scaled_features = scaler.fit_transform(numerical_features)\n    \n    # Combine scaled features with target variable\n    processed_data = pd.DataFrame(scaled_features, columns=numerical_features.columns)\n    processed_data['y'] = data['y'].values\n    return processed_data\n\n# Calculate Bruun Retraction\ndef calculate_bruun_retraction(sea_level_rise: float, cross_shore_distance: float, closure_depth: float, active_profile_height: float):\n    # Compute shoreline retraction using the Bruun equation\n    R = (sea_level_rise * cross_shore_distance) / (closure_depth + active_profile_height)\n    return R\n\n# Calculate Dean Profile\ndef calculate_dean_profile(distance: float, scale_parameter: float):\n    # Compute beach profile elevation using the Dean profile\n    elevation = scale_parameter * distance**(2/3)\n    return elevation\n\n# Build deep learning model component\ndef build_deep_learning_model(input_dim: int, output_dim: int):\n    # Define a simple feed-forward neural network model using PyTorch\n    class BeachProfileNet(nn.Module):\n        def __init__(self):\n            super(BeachProfileNet, self).__init__()\n            self.layer1 = nn.Linear(input_dim, 64)\n            self.layer2 = nn.Linear(64, 32)\n            self.layer3 = nn.Linear(32, output_dim)\n            self.relu = nn.ReLU()\n\n        def forward(self, x):\n            x = self.relu(self.layer1(x))\n            x = self.relu(self.layer2(x))\n            x = self.layer3(x)\n            return x\n    \n    model = BeachProfileNet()\n    return model\n\n# Train and evaluate model component\ndef train_and_evaluate_model(model: nn.Module, training_data: pd.DataFrame, testing_data: pd.DataFrame, epochs: int, learning_rate: float):\n    # Prepare data loaders\n    X_train = torch.tensor(training_data.drop('y', axis=1).values, dtype=torch.float32)\n    y_train = torch.tensor(training_data['y'].values, dtype=torch.float32).view(-1, 1)\n    \n    X_test = torch.tensor(testing_data.drop('y', axis=1).values, dtype=torch.float32)\n    y_test = torch.tensor(testing_data['y'].values, dtype=torch.float32).view(-1, 1)\n\n    train_dataset = TensorDataset(X_train, y_train)\n    train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)\n    \n    # Define loss function and optimizer\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=learning_rate)\n    \n    # Training loop\n    for epoch in range(epochs):\n        model.train()\n        for X_batch, y_batch in train_loader:\n            optimizer.zero_grad()\n            predictions = model(X_batch)\n            loss = criterion(predictions, y_batch)\n            loss.backward()\n            optimizer.step()\n    \n    # Evaluation\n    model.eval()\n    with torch.no_grad():\n        predictions = model(X_test)\n        test_loss = mean_squared_error(y_test, predictions.numpy())\n    \n    # Return evaluation metrics\n    return {\"mean_squared_error\": test_loss}\n\n# Main function integrating all components\ndef main():\n    # Step 1: Load data\n    train_data, test_data = load_data()\n    \n    # Step 2: Preprocess data\n    processed_train_data = preprocess_data(train_data)\n    processed_test_data = preprocess_data(test_data)\n    \n    # Step 3: Initialize model\n    input_dimensions = processed_train_data.shape[1] - 1  # subtract 1 for target variable\n    output_dimensions = 1\n    model = build_deep_learning_model(input_dimensions, output_dimensions)\n    \n    # Step 4: Train and Evaluate model\n    results = train_and_evaluate_model(model, processed_train_data, processed_test_data, epochs=10, learning_rate=0.001)\n    \n    # Return results\n    return results",
                "plan": "1. **Load Data**:\n   - The `load_data` function reads training and test datasets from Excel files using pandas.\n\n2. **Preprocess Data**:\n   - Categorical feature \"Dominant Wave Direction\" is encoded using `OneHotEncoder` to convert it into numerical form suitable for ML models.\n   - Numerical features are normalized using `StandardScaler` to ensure they have a standard distribution.\n\n3. **Bruun and Dean Models**:\n   - Functions `calculate_bruun_retraction` and `calculate_dean_profile` provide mathematical calculations based on the Bruun and Dean models, which are separately implemented from the deep learning model.\n\n4. **Deep Learning Model**\n   - A feed-forward neural network model is created using PyTorch, consisting of three layers with ReLU activation functions in between.\n\n5. **Train and Evaluate Model**:\n   - Data is converted to PyTorch tensors, and a `DataLoader` is used for batch processing during training.\n   - The model is trained for a defined number of epochs, optimizing the mean squared error loss using the Adam optimizer.\n   - After training, the model is evaluated on the test data, and the mean squared error is used as the evaluation metric.\n\n6. **Main Function**:\n   - Integrates all previous steps into a cohesive workflow that loads data, preprocesses it, builds a model, and then trains and evaluates the model.",
                "main_function_name": "main",
                "score": 0.12216252217320436,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.506,
                "radon_score": 0.7156252217320436,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 122, in main\n  File \"<string>\", line 101, in train_and_evaluate_model\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"<string>\", line 64, in forward\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\linear.py\", line 116, in forward\n    return F.linear(input, self.weight, self.bias)\nRuntimeError: mat1 and mat2 shapes cannot be multiplied (242x27 and 28x64)\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        },
        "3": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nimport torch\nfrom torch import nn, optim\nfrom sklearn.preprocessing import OneHotEncoder, StandardScaler\nfrom sklearn.metrics import mean_squared_error\nfrom torch.utils.data import DataLoader, TensorDataset\n\n# Load data component\ndef load_data():\n    training_file_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_file_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n    \n    # Read data from the Excel files\n    train_data = pd.read_excel(training_file_path)\n    test_data = pd.read_excel(test_file_path)\n    return train_data, test_data\n\n# Preprocess data component\ndef preprocess_data(data: pd.DataFrame):\n    # Identify and isolate the categorical column 'Dominant Wave Direction'\n    encoder = OneHotEncoder(sparse_output=False)\n    encoded_wave_direction = encoder.fit_transform(data[['Dominant Wave Direction']])\n    \n    # Remove the original categorical column and replace it with the encoded columns\n    data = data.drop('Dominant Wave Direction', axis=1)\n    encoded_columns = pd.DataFrame(encoded_wave_direction, index=data.index, columns=encoder.get_feature_names_out())\n    data = pd.concat([data, encoded_columns], axis=1)\n    \n    # Normalize numerical features using standard scaling\n    scaler = StandardScaler()\n    # Drop target variable 'y' from normalization\n    numerical_features = data.drop(['y'], axis=1)\n    scaled_features = scaler.fit_transform(numerical_features)\n    \n    # Combine scaled features with target variable\n    processed_data = pd.DataFrame(scaled_features, columns=numerical_features.columns)\n    processed_data['y'] = data['y'].values\n    return processed_data\n\n# Calculate Bruun Retraction\ndef calculate_bruun_retraction(sea_level_rise: float, cross_shore_distance: float, closure_depth: float, active_profile_height: float):\n    # Compute shoreline retraction using the Bruun equation\n    R = (sea_level_rise * cross_shore_distance) / (closure_depth + active_profile_height)\n    return R\n\n# Calculate Dean Profile\ndef calculate_dean_profile(distance: float, scale_parameter: float):\n    # Compute beach profile elevation using the Dean profile\n    elevation = scale_parameter * distance**(2/3)\n    return elevation\n\n# Build deep learning model component\ndef build_deep_learning_model(input_dim: int, output_dim: int):\n    # Define a simple feed-forward neural network model using PyTorch\n    class BeachProfileNet(nn.Module):\n        def __init__(self):\n            super(BeachProfileNet, self).__init__()\n            self.layer1 = nn.Linear(input_dim, 64)\n            self.layer2 = nn.Linear(64, 32)\n            self.layer3 = nn.Linear(32, output_dim)\n            self.relu = nn.ReLU()\n\n        def forward(self, x):\n            x = self.relu(self.layer1(x))\n            x = self.relu(self.layer2(x))\n            x = self.layer3(x)\n            return x\n    \n    model = BeachProfileNet()\n    return model\n\n# Train and evaluate model component\ndef train_and_evaluate_model(model: nn.Module, training_data: pd.DataFrame, testing_data: pd.DataFrame, epochs: int, learning_rate: float):\n    # Prepare data loaders\n    X_train = torch.tensor(training_data.drop('y', axis=1).values, dtype=torch.float32)\n    y_train = torch.tensor(training_data['y'].values, dtype=torch.float32).view(-1, 1)\n    \n    X_test = torch.tensor(testing_data.drop('y', axis=1).values, dtype=torch.float32)\n    y_test = torch.tensor(testing_data['y'].values, dtype=torch.float32).view(-1, 1)\n\n    train_dataset = TensorDataset(X_train, y_train)\n    train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)\n    \n    # Define loss function and optimizer\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=learning_rate)\n    \n    # Training loop\n    for epoch in range(epochs):\n        model.train()\n        for X_batch, y_batch in train_loader:\n            optimizer.zero_grad()\n            predictions = model(X_batch)\n            loss = criterion(predictions, y_batch)\n            loss.backward()\n            optimizer.step()\n    \n    # Evaluation\n    model.eval()\n    with torch.no_grad():\n        predictions = model(X_test)\n        test_loss = mean_squared_error(y_test, predictions.numpy())\n    \n    # Return evaluation metrics\n    return {\"mean_squared_error\": test_loss}\n\n# Main function integrating all components\ndef main():\n    # Step 1: Load data\n    train_data, test_data = load_data()\n    \n    # Step 2: Preprocess data\n    processed_train_data = preprocess_data(train_data)\n    processed_test_data = preprocess_data(test_data)\n    \n    # Step 3: Initialize model with correct input dimension\n    input_dimensions = processed_train_data.shape[1] - 1  # subtract 1 for target variable\n    output_dimensions = 1\n    model = build_deep_learning_model(input_dimensions, output_dimensions)\n    \n    # Step 4: Train and Evaluate model\n    results = train_and_evaluate_model(model, processed_train_data, processed_test_data, epochs=10, learning_rate=0.001)\n    \n    # Return results\n    return results",
                "plan": "1. **Load Data**: The script loads the training and test datasets from specified Excel file paths using Pandas.\n   \n2. **Preprocess Data**: It preprocesses the data by one-hot encoding the categorical 'Dominant Wave Direction' and standardizing numerical features. Both datasets are preprocessed similarly to ensure consistent feature dimensions.\n\n3. **Build Deep Learning Model**: A simple feed-forward neural network (BeachProfileNet) is defined using PyTorch. The network includes three linear layers with ReLU activations.\n\n4. **Train and Evaluate Model**: The script converts preprocessed data into tensors, uses a DataLoader for batching, defines a loss function (MSE), and the Adam optimizer for training. It trains the model over specified epochs, evaluates test data, and computes the mean-squared error.\n\n5. **Main Function**: The main function ties together data loading, preprocessing, model building, training, evaluation, and returns the performance metrics.",
                "main_function_name": "main",
                "score": 0.12216252217320436,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.506,
                "radon_score": 0.7156252217320436,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 123, in main\n  File \"<string>\", line 102, in train_and_evaluate_model\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"<string>\", line 65, in forward\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\linear.py\", line 116, in forward\n    return F.linear(input, self.weight, self.bias)\nRuntimeError: mat1 and mat2 shapes cannot be multiplied (242x27 and 28x64)\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        },
        "4": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nimport torch\nfrom torch import nn, optim\nfrom sklearn.preprocessing import OneHotEncoder, StandardScaler\nfrom sklearn.metrics import mean_squared_error\nfrom torch.utils.data import DataLoader, TensorDataset\n\n# Load data component\ndef load_data():\n    training_file_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_file_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n    \n    # Read data from the Excel files\n    train_data = pd.read_excel(training_file_path)\n    test_data = pd.read_excel(test_file_path)\n    return train_data, test_data\n\n# Preprocess data component\ndef preprocess_data(data: pd.DataFrame):\n    # Identify and isolate the categorical column 'Dominant Wave Direction'\n    encoder = OneHotEncoder(sparse_output=False)\n    encoded_wave_direction = encoder.fit_transform(data[['Dominant Wave Direction']])\n    \n    # Remove the original categorical column and replace it with the encoded columns\n    data = data.drop('Dominant Wave Direction', axis=1)\n    encoded_columns = pd.DataFrame(encoded_wave_direction, index=data.index, columns=encoder.get_feature_names_out())\n    data = pd.concat([data, encoded_columns], axis=1)\n    \n    # Normalize numerical features using standard scaling\n    scaler = StandardScaler()\n    # Drop target variable 'y' from normalization\n    numerical_features = data.drop(['y'], axis=1)\n    scaled_features = scaler.fit_transform(numerical_features)\n    \n    # Combine scaled features with target variable\n    processed_data = pd.DataFrame(scaled_features, columns=numerical_features.columns)\n    processed_data['y'] = data['y'].values\n    return processed_data\n\n# Calculate Bruun Retraction\ndef calculate_bruun_retraction(sea_level_rise: float, cross_shore_distance: float, closure_depth: float, active_profile_height: float):\n    # Compute shoreline retraction using the Bruun equation\n    R = (sea_level_rise * cross_shore_distance) / (closure_depth + active_profile_height)\n    return R\n\n# Calculate Dean Profile\ndef calculate_dean_profile(distance: float, scale_parameter: float):\n    # Compute beach profile elevation using the Dean profile\n    elevation = scale_parameter * distance**(2/3)\n    return elevation\n\n# Build deep learning model component\ndef build_deep_learning_model(input_dim: int, output_dim: int):\n    # Define a simple feed-forward neural network model using PyTorch\n    class BeachProfileNet(nn.Module):\n        def __init__(self):\n            super(BeachProfileNet, self).__init__()\n            self.layer1 = nn.Linear(input_dim, 64)\n            self.layer2 = nn.Linear(64, 32)\n            self.layer3 = nn.Linear(32, output_dim)\n            self.relu = nn.ReLU()\n\n        def forward(self, x):\n            x = self.relu(self.layer1(x))\n            x = self.relu(self.layer2(x))\n            x = self.layer3(x)\n            return x\n    \n    model = BeachProfileNet()\n    return model\n\n# Train and evaluate model component\ndef train_and_evaluate_model(model: nn.Module, training_data: pd.DataFrame, testing_data: pd.DataFrame, epochs: int, learning_rate: float):\n    # Prepare data loaders\n    X_train = torch.tensor(training_data.drop('y', axis=1).values, dtype=torch.float32)\n    y_train = torch.tensor(training_data['y'].values, dtype=torch.float32).view(-1, 1)\n    \n    X_test = torch.tensor(testing_data.drop('y', axis=1).values, dtype=torch.float32)\n    y_test = torch.tensor(testing_data['y'].values, dtype=torch.float32).view(-1, 1)\n\n    train_dataset = TensorDataset(X_train, y_train)\n    train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)\n    \n    # Define loss function and optimizer\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=learning_rate)\n    \n    # Training loop\n    for epoch in range(epochs):\n        model.train()\n        for X_batch, y_batch in train_loader:\n            optimizer.zero_grad()\n            predictions = model(X_batch)\n            loss = criterion(predictions, y_batch)\n            loss.backward()\n            optimizer.step()\n    \n    # Evaluation\n    model.eval()\n    with torch.no_grad():\n        predictions = model(X_test)\n        test_loss = mean_squared_error(y_test, predictions.numpy())\n    \n    # Return evaluation metrics\n    return {\"mean_squared_error\": test_loss}\n\n# Main function integrating all components\ndef main():\n    # Step 1: Load data\n    train_data, test_data = load_data()\n    \n    # Step 2: Preprocess data\n    processed_train_data = preprocess_data(train_data)\n    processed_test_data = preprocess_data(test_data)\n    \n    # Step 3: Initialize model with correct input dimension\n    input_dimensions = processed_train_data.shape[1] - 1  # subtract 1 for target variable\n    output_dimensions = 1\n    model = build_deep_learning_model(input_dimensions, output_dimensions)\n    \n    # Step 4: Train and Evaluate model\n    results = train_and_evaluate_model(model, processed_train_data, processed_test_data, epochs=10, learning_rate=0.001)\n    \n    # Return results\n    return results",
                "plan": "1. **Data Loading**: \n   - Load the training and test datasets from the specified Excel file paths.\n   - Return the loaded datasets for further processing.\n\n2. **Data Preprocessing**: \n   - Encode the categorical 'Dominant Wave Direction' column using one-hot encoding to convert it into numerical format.\n   - Normalize numerical features except the target variable 'y' using standard scaling to improve convergence during training.\n   - Ensure all encoded and scaled features combined with the target variable form the final processed dataset.\n\n3. **Bruun and Dean Calculations**: \n   - Implement mathematical functions for calculating shoreline retreat using the Bruun Rule and profile elevation using the Dean Model. These functions provide insights into feature engineering.\n\n4. **Model Building**: \n   - Construct a neural network using PyTorch with an input layer, two hidden layers, and an output layer with ReLU activations in between.\n\n5. **Model Training and Evaluation**: \n   - Split the dataset into features and target variable.\n   - Convert data into PyTorch tensors and use a DataLoader for batched training.\n   - Define the loss function and optimizer, followed by a training loop over specified epochs.\n   - Evaluate the model using mean squared error on the test dataset.\n\n6. **Integration and Execution**: \n   - Combine all steps in a single main function that loads the data, preprocesses it, builds and trains the model, then evaluates its performance.\n\nThis plan ensures that the code remains modular, maintainable, and integrates all components correctly.",
                "main_function_name": "main",
                "score": 0.12216252217320436,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.506,
                "radon_score": 0.7156252217320436,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 123, in main\n  File \"<string>\", line 102, in train_and_evaluate_model\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"<string>\", line 65, in forward\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\linear.py\", line 116, in forward\n    return F.linear(input, self.weight, self.bias)\nRuntimeError: mat1 and mat2 shapes cannot be multiplied (242x27 and 28x64)\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        }
    },
    {
        "0": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nfrom sklearn.preprocessing import MinMaxScaler, OneHotEncoder\nfrom sklearn.metrics import mean_squared_error, mean_absolute_error\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\n\ndef load_and_preprocess_data(train_path, test_path):\n    # Load datasets\n    train_df = pd.read_excel(train_path)\n    test_df = pd.read_excel(test_path)\n\n    # One-hot encoding for the categorical 'Dominant Wave Direction' column\n    one_hot_encoder = OneHotEncoder(sparse=False)\n    train_encoded = one_hot_encoder.fit_transform(train_df[['Dominant Wave Direction']])\n    test_encoded = one_hot_encoder.transform(test_df[['Dominant Wave Direction']])\n\n    # Normalizing numerical features\n    numerical_cols = train_df.select_dtypes(include=[np.float64, np.int64]).columns\n    scaler = MinMaxScaler()\n    train_df[numerical_cols] = scaler.fit_transform(train_df[numerical_cols])\n    test_df[numerical_cols] = scaler.transform(test_df[numerical_cols])\n\n    # Preparing input features and target variable\n    train_features = np.concatenate((train_df[numerical_cols].values, train_encoded), axis=1)\n    train_targets = train_df['y'].values\n\n    test_features = np.concatenate((test_df[numerical_cols].values, test_encoded), axis=1)\n    test_targets = test_df['y'].values\n\n    return {'features': train_features, 'targets': train_targets}, {'features': test_features, 'targets': test_targets}\n\ndef calculate_bruun_parameters(sea_level_rise, profile_width, berm_height, depth_closure, features):\n    bruun_params = (sea_level_rise * profile_width) / (berm_height + depth_closure)\n    return [param + bruun_params for param in features]\n\ndef calculate_dean_parameters(x, shape_param):\n    return [shape_param * dist**(2/3) for dist in x]\n\ndef build_and_train_model(train_data, test_data):\n    # Setting up the neural network architecture with PyTorch\n    class MLPModel(nn.Module):\n        def __init__(self, input_size):\n            super(MLPModel, self).__init__()\n            self.hidden = nn.Sequential(\n                nn.Linear(input_size, 64),\n                nn.ReLU(),\n                nn.Linear(64, 32),\n                nn.ReLU(),\n                nn.Linear(32, 1)  # Single output because it's regression\n            )\n        \n        def forward(self, x):\n            return self.hidden(x)\n\n    train_features = torch.tensor(train_data['features'], dtype=torch.float32)\n    train_targets = torch.tensor(train_data['targets'], dtype=torch.float32).view(-1, 1)\n\n    model = MLPModel(train_features.shape[1])\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=0.001)\n\n    # Training loop\n    for epoch in range(100):\n        model.train()\n        optimizer.zero_grad()\n        outputs = model(train_features)\n        loss = criterion(outputs, train_targets)\n        loss.backward()\n        optimizer.step()\n    \n    return model\n\ndef evaluate_model(model, test_data):\n    model.eval()\n    test_features = torch.tensor(test_data['features'], dtype=torch.float32)\n\n    with torch.no_grad():\n        predictions = model(test_features).numpy().flatten()\n\n    rmse = np.sqrt(mean_squared_error(test_data['targets'], predictions))\n    mae = mean_absolute_error(test_data['targets'], predictions)\n\n    return rmse, mae\n\ndef main():\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n\n    train_data, test_data = load_and_preprocess_data(train_path, test_path)\n    \n    sea_level_rise = 0.3  # Example value\n    profile_width = 400   # Example value\n    berm_height = 2       # Example value\n    depth_closure = 10    # Example value\n\n    # Calculating additional features via Bruun and Dean models\n    bruun_params = calculate_bruun_parameters(sea_level_rise, profile_width, berm_height, depth_closure, train_data['features'])\n    dean_params = calculate_dean_parameters(train_data['features'][:, 0], 0.1)  # Example shape parameter\n\n    # Incorporate additional features\n    train_data['features'] = np.column_stack([train_data['features'], bruun_params, dean_params])\n    test_data['features'] = np.column_stack([test_data['features'], bruun_params, dean_params])\n\n    # Build, train, and evaluate the model\n    model = build_and_train_model(train_data, test_data)\n    rmse, mae = evaluate_model(model, test_data)\n\n    return rmse, mae",
                "plan": "1. **Data Loading and Preprocessing**:\n   - Load the training and testing datasets from specified Excel files.\n   - Apply one-hot encoding to the 'Dominant Wave Direction' column to convert categorical data into numerical format.\n   - Normalize the numerical columns using Min-Max scaling for uniformity in training.\n\n2. **Feature Engineering with Bruun and Dean Models**:\n   - Compute additional features using formulas from the Bruun and Dean models.\n   - These additional features help in capturing domain-specific interactions for better prediction accuracy.\n\n3. **Model Construction and Training**:\n   - Define a Multilayer Perceptron (MLP) using PyTorch for regression purposes.\n   - Compile the model, employ a loss function (MSE), and use the Adam optimizer.\n   - Train the model using the prepared training data.\n\n4. **Model Evaluation**:\n   - Evaluate the trained model on testing data.\n   - Calculate performance metrics RMSE and MAE to assess prediction accuracy and error rates.\n\n5. **Integration**:\n   - Bring all components together in the `main` function, which executes the entire workflow from data processing to evaluation.",
                "main_function_name": "main",
                "score": 0.13823320306816306,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.7,
                "radon_score": 0.6823320306816307,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 104, in main\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\numpy\\lib\\shape_base.py\", line 652, in column_stack\n    return _nx.concatenate(arrays, 1)\nValueError: all the input array dimensions except for the concatenation axis must match exactly, but along dimension 0, the array at index 0 has size 242 and the array at index 1 has size 536\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        },
        "1": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nfrom sklearn.preprocessing import MinMaxScaler, OneHotEncoder\nfrom sklearn.metrics import mean_squared_error, mean_absolute_error\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\n\ndef load_and_preprocess_data(train_path, test_path):\n    # Load datasets\n    train_df = pd.read_excel(train_path)\n    test_df = pd.read_excel(test_path)\n\n    # One-hot encoding for the categorical 'Dominant Wave Direction' column\n    one_hot_encoder = OneHotEncoder(sparse=False)\n    train_encoded = one_hot_encoder.fit_transform(train_df[['Dominant Wave Direction']])\n    test_encoded = one_hot_encoder.transform(test_df[['Dominant Wave Direction']])\n\n    # Normalizing numerical features\n    numerical_cols = train_df.select_dtypes(include=[np.float64, np.int64]).columns\n    scaler = MinMaxScaler()\n    train_df[numerical_cols] = scaler.fit_transform(train_df[numerical_cols])\n    test_df[numerical_cols] = scaler.transform(test_df[numerical_cols])\n\n    # Preparing input features and target variable\n    train_features = np.concatenate((train_df[numerical_cols].values, train_encoded), axis=1)\n    train_targets = train_df['y'].values\n\n    test_features = np.concatenate((test_df[numerical_cols].values, test_encoded), axis=1)\n    test_targets = test_df['y'].values\n\n    return {'features': train_features, 'targets': train_targets}, {'features': test_features, 'targets': test_targets}\n\ndef calculate_bruun_parameters(sea_level_rise, profile_width, berm_height, depth_closure, features):\n    bruun_params = (sea_level_rise * profile_width) / (berm_height + depth_closure)\n    return np.full((features.shape[0], 1), bruun_params)\n\ndef calculate_dean_parameters(x, shape_param):\n    return shape_param * x**(2/3)\n\ndef build_and_train_model(train_data, test_data):\n    # Setting up the neural network architecture with PyTorch\n    class MLPModel(nn.Module):\n        def __init__(self, input_size):\n            super(MLPModel, self).__init__()\n            self.hidden = nn.Sequential(\n                nn.Linear(input_size, 64),\n                nn.ReLU(),\n                nn.Linear(64, 32),\n                nn.ReLU(),\n                nn.Linear(32, 1)  # Single output because it's regression\n            )\n        \n        def forward(self, x):\n            return self.hidden(x)\n\n    train_features = torch.tensor(train_data['features'], dtype=torch.float32)\n    train_targets = torch.tensor(train_data['targets'], dtype=torch.float32).view(-1, 1)\n\n    model = MLPModel(train_features.shape[1])\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=0.001)\n\n    # Training loop\n    for epoch in range(100):\n        model.train()\n        optimizer.zero_grad()\n        outputs = model(train_features)\n        loss = criterion(outputs, train_targets)\n        loss.backward()\n        optimizer.step()\n    \n    return model\n\ndef evaluate_model(model, test_data):\n    model.eval()\n    test_features = torch.tensor(test_data['features'], dtype=torch.float32)\n\n    with torch.no_grad():\n        predictions = model(test_features).numpy().flatten()\n\n    rmse = np.sqrt(mean_squared_error(test_data['targets'], predictions))\n    mae = mean_absolute_error(test_data['targets'], predictions)\n\n    return rmse, mae\n\ndef main():\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n\n    train_data, test_data = load_and_preprocess_data(train_path, test_path)\n    \n    sea_level_rise = 0.3  # Example value\n    profile_width = 400   # Example value\n    berm_height = 2       # Example value\n    depth_closure = 10    # Example value\n    shape_param = 0.1     # Example shape parameter\n\n    # Calculating additional features via Bruun and Dean models\n    bruun_params_train = calculate_bruun_parameters(sea_level_rise, profile_width, berm_height, depth_closure, train_data['features'])\n    dean_params_train = calculate_dean_parameters(train_data['features'][:, 0], shape_param)\n    bruun_params_test = calculate_bruun_parameters(sea_level_rise, profile_width, berm_height, depth_closure, test_data['features'])\n    dean_params_test = calculate_dean_parameters(test_data['features'][:, 0], shape_param)\n\n    # Incorporate additional features \n    train_data['features'] = np.column_stack([train_data['features'], bruun_params_train, dean_params_train])\n    test_data['features'] = np.column_stack([test_data['features'], bruun_params_test, dean_params_test])\n\n    # Build, train, and evaluate the model\n    model = build_and_train_model(train_data, test_data)\n    rmse, mae = evaluate_model(model, test_data)\n\n    return rmse, mae",
                "plan": "1. **Load and Preprocess Data**:\n   - Load the data from specified paths using pandas.\n   - Encode the categorical 'Dominant Wave Direction' column using one-hot encoding.\n   - Normalize the numerical columns of the data using Min-Max scaling to ensure they are on the same scale.\n   - Prepare input features by concatenating encoded categorical data to normalized numerical data. Separate targets column 'y'.\n\n2. **Calculate Bruun and Dean Parameters**:\n   - Use predefined formulas to calculate Bruun and Dean parameters for each data entry.\n   - Use `calculate_bruun_parameters` to create arrays with a constant shift per feature entry.\n   - Use `calculate_dean_parameters` with each row's first feature as input to calculate Dean parameters.\n\n3. **Build and Train Model**:\n   - Define a simple MLP (Multi-Layer Perceptron) model using PyTorch for regression tasks.\n   - Train the model using the train data over several epochs, minimizing mean squared error.\n\n4. **Evaluate Model**:\n   - Evaluate the trained model on the test dataset using RMSE and MAE metrics.\n\n5. **Combine all Components**:\n   - Define a `main` function that orchestrates loading data, training the model, and evaluating it.\n\n6. **Run without Input**:\n   - Ensure the `main` function runs independently without requiring input, adhering to task specifications.",
                "main_function_name": "main",
                "score": 0.83400787752513,
                "pass_rate": 1.0,
                "pass_rate_score": 1.0,
                "prediction_score": 0.0,
                "pylint_score": 0.658,
                "radon_score": 0.6820787752513,
                "test_case_results": {
                    "runnability_check": {
                        "success": true,
                        "reason": null,
                        "message": "code is runnable"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        }
    },
    {
        "0": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nfrom sklearn.preprocessing import OneHotEncoder, StandardScaler\nfrom sklearn.model_selection import train_test_split\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\nimport torch.utils.data as data\n\n# Component: data_loader\ndef data_loader(train_file_path: str, test_file_path: str):\n    # Load data from Excel files\n    train_df = pd.read_excel(train_file_path)\n    test_df = pd.read_excel(test_file_path)\n\n    # One-hot encode the 'Dominant Wave Direction' column\n    encoder = OneHotEncoder(sparse=False)\n    wave_dir_encoded_train = encoder.fit_transform(train_df[['Dominant Wave Direction']])\n    wave_dir_encoded_test = encoder.transform(test_df[['Dominant Wave Direction']])\n\n    # Convert encoded columns back to DataFrame\n    wave_dir_encoded_df_train = pd.DataFrame(wave_dir_encoded_train, \n                                             columns=encoder.get_feature_names_out(['Dominant Wave Direction']))\n    wave_dir_encoded_df_test = pd.DataFrame(wave_dir_encoded_test, \n                                            columns=encoder.get_feature_names_out(['Dominant Wave Direction']))\n\n    # Drop original 'Dominant Wave Direction' column and concatenate encoded columns\n    train_df = train_df.drop(['Dominant Wave Direction'], axis=1)\n    test_df = test_df.drop(['Dominant Wave Direction'], axis=1)\n    train_df = pd.concat([train_df, wave_dir_encoded_df_train], axis=1)\n    test_df = pd.concat([test_df, wave_dir_encoded_df_test], axis=1)\n\n    # Standardize numerical columns\n    scaler = StandardScaler()\n    numerical_columns = train_df.select_dtypes(include=np.number).columns\n    train_df[numerical_columns] = scaler.fit_transform(train_df[numerical_columns])\n    test_df[numerical_columns] = scaler.transform(test_df[numerical_columns])\n\n    return train_df, test_df\n\n# Component: feature_engineering\ndef feature_engineering(df: pd.DataFrame):\n    # Example feature engineering step: create a polynomial feature\n    df['x_squared'] = df['x'] ** 2\n\n    # Placeholder for more complex logic such as domain knowledge features based on Dean and Bruun models\n    # Further analysis can be added here\n\n    return df\n\n# Component: deep_learning_model\nclass DeepLearningModel(nn.Module):\n    def __init__(self, input_dim):\n        super(DeepLearningModel, self).__init__()\n        self.model = nn.Sequential(\n            nn.Linear(input_dim, 128),\n            nn.ReLU(),\n            nn.Dropout(0.3),\n            nn.Linear(128, 64),\n            nn.ReLU(),\n            nn.Linear(64, 1)\n        )\n\n    def forward(self, x):\n        return self.model(x)\n\n# Component: train_and_evaluate_model\ndef train_and_evaluate_model(model, X_train, y_train, X_test, y_test):\n    # Prepare datasets\n    train_dataset = data.TensorDataset(torch.tensor(X_train, dtype=torch.float32), \n                                       torch.tensor(y_train, dtype=torch.float32))\n    test_dataset = data.TensorDataset(torch.tensor(X_test, dtype=torch.float32), \n                                      torch.tensor(y_test, dtype=torch.float32))\n\n    train_loader = data.DataLoader(train_dataset, batch_size=32, shuffle=True)\n    test_loader = data.DataLoader(test_dataset, batch_size=32, shuffle=False)\n\n    # Define optimizer and loss function\n    optimizer = optim.Adam(model.parameters(), lr=0.001)\n    criterion = nn.MSELoss()\n\n    # Training loop\n    for epoch in range(100):  # Example: 100 epochs\n        model.train()\n        for X_batch, y_batch in train_loader:\n            optimizer.zero_grad()\n            outputs = model(X_batch)\n            loss = criterion(outputs.squeeze(), y_batch)\n            loss.backward()\n            optimizer.step()\n\n    # Evaluation\n    model.eval()\n    test_loss = 0\n    with torch.no_grad():\n        for X_batch, y_batch in test_loader:\n            outputs = model(X_batch)\n            loss = criterion(outputs.squeeze(), y_batch)\n            test_loss += loss.item()\n\n    avg_test_loss = test_loss / len(test_loader)\n\n    # Output a dictionary with evaluation results\n    return {\"test_loss\": avg_test_loss}\n\n# Main function integrating all components\ndef main():\n    # Load and preprocess the data\n    train_df, test_df = data_loader(\n        \"beach_profile_data/processed_data/beachdata_train.xlsx\",\n        \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n    )\n\n    # Feature engineering\n    train_df = feature_engineering(train_df)\n    test_df = feature_engineering(test_df)\n\n    # Prepare input data and target\n    features = [col for col in train_df.columns if col != \"y\"]\n    X_train = train_df[features].to_numpy()\n    y_train = train_df['y'].to_numpy()\n    X_test = test_df[features].to_numpy()\n    y_test = test_df['y'].to_numpy()\n\n    # Instatiate deep learning model\n    model = DeepLearningModel(input_dim=X_train.shape[1])\n\n    # Train and evaluate model\n    results = train_and_evaluate_model(model, X_train, y_train, X_test, y_test)\n\n    return results",
                "plan": "1. **Data Loading and Preprocessing**: The `data_loader` function reads the training and test datasets from provided Excel files. It performs one-hot encoding on categorical data and standardizes numerical features for better model learning.\n\n2. **Feature Engineering**: The `feature_engineering` function adds a polynomial feature for demonstration purposes. Other domain knowledge-based features could be added here.\n\n3. **Model Definition**: A simple deep learning model class `DeepLearningModel` is defined using PyTorch, with dropout regularization to reduce overfitting.\n\n4. **Model Training and Evaluation**: `train_and_evaluate_model` drives the training loop for the model, evaluating on both training and test data sets, calculating the test loss which indicates model performance.\n\n5. **Main Integration**: The `main` function brings all components together, managing data processing, feature engineering, model training, and evaluation to return the model's performance metrics.",
                "main_function_name": "main",
                "score": 0.833368516688995,
                "pass_rate": 1.0,
                "pass_rate_score": 1.0,
                "prediction_score": 0.0,
                "pylint_score": 0.6,
                "radon_score": 0.7336851668899504,
                "test_case_results": {
                    "runnability_check": {
                        "success": true,
                        "reason": null,
                        "message": "code is runnable"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.07692307692307693
                }
            }
        }
    },
    {
        "0": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nfrom sklearn.model_selection import train_test_split\nfrom sklearn.metrics import mean_squared_error, mean_absolute_error\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\nfrom scipy.optimize import curve_fit\n\n# Function to load and preprocess the data including encoding, scaling, and splitting\ndef load_and_preprocess_data(train_data_path, test_data_path):\n    # Load data from the given file paths\n    train_df = pd.read_excel(train_data_path)\n    test_df = pd.read_excel(test_data_path)\n    \n    # One-hot encode 'Dominant Wave Direction'\n    one_hot_encoder = OneHotEncoder(sparse=False)\n    for df in [train_df, test_df]:\n        wave_direction_encoded = one_hot_encoder.fit_transform(df[['Dominant Wave Direction']])\n        column_names = [f'WaveDir_{i}' for i in range(wave_direction_encoded.shape[1])]\n        df[column_names] = wave_direction_encoded\n        df.drop(columns=['Dominant Wave Direction'], inplace=True)\n\n    # Scale numerical features using StandardScaler\n    numerical_features = [col for col in train_df.columns if train_df[col].dtype in [np.float64, np.int64] and col not in ['x', 'y']]\n    scaler = StandardScaler()\n    \n    train_df[numerical_features] = scaler.fit_transform(train_df[numerical_features])\n    test_df[numerical_features] = scaler.transform(test_df[numerical_features])\n    \n    # Split the data into features and target\n    x_train = train_df.drop(columns=['y'])\n    y_train = train_df['y']\n    \n    x_test = test_df.drop(columns=['y'])\n    y_test = test_df['y']\n    \n    return (x_train, y_train), (x_test, y_test)\n\n# Function to calculate additional features based on Bruun Rule and Dean Model\ndef bru_and_dean_model_features(df):\n    # Calculate Bruun Rule shoreline recession (S = R / (m + h))\n    # Assumed values as a demonstration; these would be computed based on other data in practice\n    df['ShorelineRecession'] = df['Relative Tidal Range'] / (df['Intertidal Slope'] + df['High Tide Sediment Settling Velocity'])\n    \n    # Fit the Dean model and calculate the 'A' coefficient for 'h(x) = A * x^(2/3)' using curve fitting\n    def dean_model(x, A):\n        return A * np.power(x, 2/3)\n\n    df['Dean_A'] = df.apply(lambda row: curve_fit(dean_model, row['x'], row['y'])[0][0], axis=1)\n    \n    return df\n\n# Build a deep learning model using PyTorch\ndef build_neural_network(input_size, output_size):\n    # Define the neural network architecture\n    model = nn.Sequential(\n        nn.Linear(input_size, 64),\n        nn.ReLU(),\n        nn.Linear(64, 32),\n        nn.ReLU(),\n        nn.Linear(32, output_size)\n    )\n    return model\n\n# Train the PyTorch model and evaluate its performance\ndef train_and_evaluate_model(model, train_data, test_data, epochs):\n    # Unpack train and test data\n    (x_train, y_train), (x_test, y_test) = train_data, test_data\n    \n    # Convert data to PyTorch tensors\n    x_train_tensor = torch.tensor(x_train.values, dtype=torch.float32)\n    y_train_tensor = torch.tensor(y_train.values, dtype=torch.float32).view(-1, 1)\n    x_test_tensor = torch.tensor(x_test.values, dtype=torch.float32)\n    y_test_tensor = torch.tensor(y_test.values, dtype=torch.float32).view(-1, 1)\n    \n    # Loss and optimizer\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=0.001)\n    \n    # Train the model\n    for epoch in range(epochs):\n        model.train()\n        optimizer.zero_grad()\n        output = model(x_train_tensor)\n        loss = criterion(output, y_train_tensor)\n        loss.backward()\n        optimizer.step()\n    \n    # Evaluate the model\n    model.eval()\n    with torch.no_grad():\n        test_output = model(x_test_tensor)\n    \n    # Calculate evaluation metrics\n    rmse = mean_squared_error(y_test_tensor, test_output, squared=False)\n    mae = mean_absolute_error(y_test_tensor, test_output)\n    \n    return {'RMSE': rmse, 'MAE': mae}\n\n# Main function to integrate all components\ndef main():\n    # Paths to the data files\n    train_data_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_data_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n    \n    # Load and preprocess data\n    train_data, test_data = load_and_preprocess_data(train_data_path, test_data_path)\n    \n    # Enhance the training and test dataset with additional features\n    x_train, y_train = bru_and_dean_model_features(pd.concat([train_data[0], train_data[1]], axis=1))\n    x_test, y_test = bru_and_dean_model_features(pd.concat([test_data[0], test_data[1]], axis=1))\n    \n    # Prepare input and output data\n    input_size = x_train.shape[1]\n    output_size = 1\n\n    # Build the neural network model using the input size and output size\n    model = build_neural_network(input_size, output_size)\n    \n    # Train and evaluate the model\n    metrics = train_and_evaluate_model(model, (x_train, y_train), (x_test, y_test), epochs=100)\n    \n    # Return the evaluation metrics\n    return metrics",
                "plan": "The implementation follows a structured approach as outlined in the provided plan. Here's a step-by-step explanation of the code's workflow:\n\n1. **`load_and_preprocess_data` Function**:\n   - This function reads the training and test datasets from specified Excel files.\n   - It performs one-hot encoding on the 'Dominant Wave Direction' categorical column.\n   - Numerical features are scaled using StandardScaler to standardize them.\n   - Finally, the function splits the data into features (`x`) and target (`y`) for both training and test sets.\n\n2. **`bru_and_dean_model_features` Function**:\n   - Adds new features to the DataFrame based on the Bruun Rule and Dean Model.\n   - For the Bruun Rule: Computes the shoreline recession using relevant features.\n   - For the Dean Model: Fits a power-law model to compute the parameter A, which is added as a new feature.\n\n3. **`build_neural_network` Function**:\n   - This function creates a PyTorch sequential model.\n   - It consists of a series of linear layers and nonlinear activation functions (ReLU).\n   - The architecture is intended to receive an input size that matches the number of features and to predict a single output.\n\n4. **`train_and_evaluate_model` Function**:\n   - Converts training and test datasets to PyTorch tensors.\n   - Specifies a loss function (MSE) and an optimizer (Adam).\n   - Trains the model for a defined number of epochs.\n   - Evaluates test performance using RMSE and MAE as metrics.\n\n5. **`main` Function**:\n   - Integrates all components in sequence: data loading/preprocessing, feature enhancement, model building, and evaluation.\n   - Uses the described methods to compute metrics for assessing the model's performance.\n\nThe plan ensures that the code is resilient and adheres to the outlined architectural structure, allowing for straightforward execution of the main function.",
                "main_function_name": "main",
                "score": 0.12051565633934598,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.485,
                "radon_score": 0.7201565633934598,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 109, in main\n  File \"<string>\", line 30, in load_and_preprocess_data\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\frame.py\", line 3902, in __getitem__\n    indexer = self.columns._get_indexer_strict(key, \"columns\")[1]\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\indexes\\base.py\", line 6114, in _get_indexer_strict\n    self._raise_if_missing(keyarr, indexer, axis_name)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\indexes\\base.py\", line 6178, in _raise_if_missing\n    raise KeyError(f\"{not_found} not in index\")\nKeyError: \"['WaveDir_3'] not in index\"\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.023668639053254437
                }
            }
        },
        "1": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nfrom sklearn.model_selection import train_test_split\nfrom sklearn.metrics import mean_squared_error, mean_absolute_error\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\nfrom scipy.optimize import curve_fit\n\n# Function to load and preprocess the data including encoding, scaling, and splitting\ndef load_and_preprocess_data(train_data_path, test_data_path):\n    # Load data from the given file paths\n    train_df = pd.read_excel(train_data_path)\n    test_df = pd.read_excel(test_data_path)\n    \n    # Combine the data to ensure consistent encoding\n    combined_df = pd.concat([train_df, test_df])\n    \n    # One-hot encode 'Dominant Wave Direction'\n    one_hot_encoder = OneHotEncoder(sparse=False)\n    wave_direction_encoded = one_hot_encoder.fit_transform(combined_df[['Dominant Wave Direction']])\n    column_names = [f'WaveDir_{i}' for i in range(wave_direction_encoded.shape[1])]\n    \n    # Add encoded features to the combined dataframe\n    wave_direction_df = pd.DataFrame(wave_direction_encoded, columns=column_names, index=combined_df.index)\n    combined_df = pd.concat([combined_df, wave_direction_df], axis=1)\n    combined_df.drop(columns=['Dominant Wave Direction'], inplace=True)\n    \n    # Split back the combined dataframe into train and test sets\n    train_df = combined_df.loc[train_df.index]\n    test_df = combined_df.loc[test_df.index]\n\n    # Scale numerical features using StandardScaler\n    numerical_features = [col for col in train_df.columns if train_df[col].dtype in [np.float64, np.int64] and col not in ['x', 'y']]\n    scaler = StandardScaler()\n    \n    train_df[numerical_features] = scaler.fit_transform(train_df[numerical_features])\n    test_df[numerical_features] = scaler.transform(test_df[numerical_features])\n    \n    # Split the data into features and target\n    x_train = train_df.drop(columns=['y'])\n    y_train = train_df['y']\n    \n    x_test = test_df.drop(columns=['y'])\n    y_test = test_df['y']\n    \n    return (x_train, y_train), (x_test, y_test)\n\n# Function to calculate additional features based on Bruun Rule and Dean Model\ndef bru_and_dean_model_features(df):\n    # Calculate Bruun Rule shoreline recession (S = R / (m + h))\n    df['ShorelineRecession'] = df['Relative Tidal Range'] / (df['Intertidal Slope'] + df['High Tide Sediment Settling Velocity'])\n    \n    # Fit the Dean model and calculate the 'A' coefficient for 'h(x) = A * x^(2/3)' using curve fitting\n    def dean_model(x, A):\n        return A * np.power(x, 2/3)\n\n    def fit_dean_model(row):\n        try:\n            A, _ = curve_fit(dean_model, np.array([row['x']]), np.array([row['y']]))\n            return A[0]\n        except:\n            return np.nan # Handle cases where curve fitting fails\n\n    df['Dean_A'] = df.apply(fit_dean_model, axis=1)\n    \n    return df\n\n# Build a deep learning model using PyTorch\ndef build_neural_network(input_size, output_size):\n    # Define the neural network architecture\n    model = nn.Sequential(\n        nn.Linear(input_size, 64),\n        nn.ReLU(),\n        nn.Linear(64, 32),\n        nn.ReLU(),\n        nn.Linear(32, output_size)\n    )\n    return model\n\n# Train the PyTorch model and evaluate its performance\ndef train_and_evaluate_model(model, train_data, test_data, epochs):\n    # Unpack train and test data\n    (x_train, y_train), (x_test, y_test) = train_data, test_data\n    \n    # Convert data to PyTorch tensors\n    x_train_tensor = torch.tensor(x_train.values, dtype=torch.float32)\n    y_train_tensor = torch.tensor(y_train.values, dtype=torch.float32).view(-1, 1)\n    x_test_tensor = torch.tensor(x_test.values, dtype=torch.float32)\n    y_test_tensor = torch.tensor(y_test.values, dtype=torch.float32).view(-1, 1)\n    \n    # Loss and optimizer\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=0.001)\n    \n    # Train the model\n    for epoch in range(epochs):\n        model.train()\n        optimizer.zero_grad()\n        output = model(x_train_tensor)\n        loss = criterion(output, y_train_tensor)\n        loss.backward()\n        optimizer.step()\n    \n    # Evaluate the model\n    model.eval()\n    with torch.no_grad():\n        test_output = model(x_test_tensor)\n    \n    # Calculate evaluation metrics\n    rmse = mean_squared_error(y_test_tensor, test_output, squared=False)\n    mae = mean_absolute_error(y_test_tensor, test_output)\n    \n    return {'RMSE': rmse, 'MAE': mae}\n\n# Main function to integrate all components\ndef main():\n    # Paths to the data files\n    train_data_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_data_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n    \n    # Load and preprocess data\n    train_data, test_data = load_and_preprocess_data(train_data_path, test_data_path)\n    \n    # Enhance the training and test datasets with additional features\n    train_df = pd.concat([train_data[0], train_data[1]], axis=1)\n    test_df = pd.concat([test_data[0], test_data[1]], axis=1)\n    \n    train_df = bru_and_dean_model_features(train_df)\n    test_df = bru_and_dean_model_features(test_df)\n    \n    # Update processed train and test data\n    x_train = train_df.drop(columns=['y'])\n    y_train = train_df['y']\n    \n    x_test = test_df.drop(columns=['y'])\n    y_test = test_df['y']\n    \n    # Prepare input and output data\n    input_size = x_train.shape[1]\n    output_size = 1\n\n    # Build the neural network model using the input size and output size\n    model = build_neural_network(input_size, output_size)\n    \n    # Train and evaluate the model\n    metrics = train_and_evaluate_model(model, (x_train, y_train), (x_test, y_test), epochs=100)\n    \n    # Return the evaluation metrics\n    return metrics",
                "plan": "1. **Data Loading**: Import the necessary libraries and load the training and testing data from the specified file paths using `pandas.read_excel`.\n\n2. **Data Preprocessing**: \n   - Concatenate train and test datasets for consistent one-hot encoding.\n   - Perform one-hot encoding for the 'Dominant Wave Direction' feature and integrate it into the data.\n   - Scale numerical features using `StandardScaler` to ensure model stability and performance.\n\n3. **Feature Engineering**:\n   - Create additional features based on Bruun Rule and Dean Model by adding 'ShorelineRecession' and 'Dean_A' to the dataset. \n   - Handle exceptional cases in Dean model fitting to prevent runtime errors.\n\n4. **Model Building**:\n   - Use PyTorch to define a neural network with a sequential architecture composed of three layers with ReLU activations.\n\n5. **Model Training & Evaluation**:\n   - Convert the training and testing data into `torch` tensors.\n   - Train the model using the Adam optimizer and MSELoss criterion over a defined number of epochs.\n   - Evaluate the model using RMSE and MAE, providing a comprehensive view of performance.\n\n6. **Main Function Execution**:\n   - Integrate the workflow through the main function, `main`, which loads data, preprocesses it, augments it with additional features, constructs the model, trains and evaluates it, and finally, returns the performance metrics.",
                "main_function_name": "main",
                "score": 0.8171666148142649,
                "pass_rate": 1.0,
                "pass_rate_score": 1.0,
                "prediction_score": 0.0,
                "pylint_score": 0.47000000000000003,
                "radon_score": 0.7016661481426485,
                "test_case_results": {
                    "runnability_check": {
                        "success": true,
                        "reason": null,
                        "message": "code is runnable"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.023668639053254437
                }
            }
        }
    },
    {
        "0": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nfrom torch.utils.data import DataLoader, TensorDataset\nfrom sklearn.preprocessing import OneHotEncoder, StandardScaler\nimport numpy as np\n\n# Load the data from Excel files\ndef load_data(train_path, test_path):\n    train_data = pd.read_excel(train_path)\n    test_data = pd.read_excel(test_path)\n    return train_data, test_data\n\n# One-hot encode the 'Dominant Wave Direction' feature\ndef encode_wave_direction(dataframe):\n    encoder = OneHotEncoder(sparse=False)\n    wave_direction_encoded = encoder.fit_transform(dataframe[['Dominant Wave Direction']])\n    wave_direction_df = pd.DataFrame(wave_direction_encoded, columns=encoder.get_feature_names_out(['Dominant Wave Direction']))\n    dataframe = dataframe.drop('Dominant Wave Direction', axis=1)\n    dataframe = pd.concat([dataframe, wave_direction_df], axis=1)\n    return dataframe\n\n# Normalize continuous features\ndef preprocess_features(dataframe):\n    # Assume features to normalize exclude 'x' and 'y'\n    features_to_normalize = dataframe.drop(['x', 'y'], axis=1).select_dtypes(include=[np.number]).columns\n    scaler = StandardScaler()\n    dataframe[features_to_normalize] = scaler.fit_transform(dataframe[features_to_normalize])\n    return dataframe\n\n# Compute the shoreline retreat using the Bruun rule\ndef compute_bruun_retreat(R, B, h):\n    return (R * B) / (h + B)\n\n# Compute the water depth using the Dean model\ndef compute_dean_depth(A, x):\n    return A * (x ** (2/3))\n\n# Build and compile a PyTorch deep learning model\ndef build_deep_learning_model(input_dim):\n    model = nn.Sequential(\n        nn.Linear(input_dim, 64),\n        nn.ReLU(),\n        nn.Linear(64, 32),\n        nn.ReLU(),\n        nn.Linear(32, 1)  # Output layer for regression\n    )\n    return model\n\n# Train the PyTorch model\ndef train_model(model, train_loader, epochs):\n    criterion = nn.MSELoss()\n    optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n    model.train()\n    \n    for epoch in range(epochs):\n        for inputs, targets in train_loader:\n            optimizer.zero_grad()\n            outputs = model(inputs)\n            loss = criterion(outputs, targets)\n            loss.backward()\n            optimizer.step()\n    \n    return model\n\n# Evaluate the trained model\ndef evaluate_model(model, test_loader):\n    model.eval()\n    total_loss = 0\n    criterion = nn.MSELoss()\n    \n    with torch.no_grad():\n        for inputs, targets in test_loader:\n            outputs = model(inputs)\n            loss = criterion(outputs, targets)\n            total_loss += loss.item()\n    \n    # Calculate mean loss\n    mean_loss = total_loss / len(test_loader)\n    return {\"Mean Square Error\": mean_loss}\n\n# Main function to integrate all components\ndef main():\n    # Load data\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n    \n    train_data, test_data = load_data(train_path, test_path)\n    \n    # Preprocessing\n    train_data = encode_wave_direction(train_data)\n    test_data = encode_wave_direction(test_data)\n    \n    train_data = preprocess_features(train_data)\n    test_data = preprocess_features(test_data)\n    \n    # Prepare data for deep learning\n    X_train = torch.tensor(train_data.drop('y', axis=1).values, dtype=torch.float32)\n    y_train = torch.tensor(train_data['y'].values, dtype=torch.float32).view(-1, 1)\n    train_dataset = TensorDataset(X_train, y_train)\n    train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)\n    \n    X_test = torch.tensor(test_data.drop('y', axis=1).values, dtype=torch.float32)\n    y_test = torch.tensor(test_data['y'].values, dtype=torch.float32).view(-1, 1)\n    test_dataset = TensorDataset(X_test, y_test)\n    test_loader = DataLoader(test_dataset, batch_size=32, shuffle=False)\n    \n    # Build model\n    input_dim = X_train.shape[1]\n    model = build_deep_learning_model(input_dim)\n\n    # Train model\n    epochs = 100\n    trained_model = train_model(model, train_loader, epochs)\n    \n    # Evaluate model\n    evaluation_metrics = evaluate_model(trained_model, test_loader)\n    \n    return evaluation_metrics",
                "plan": "1. **Load Data**: The load_data function handles the reading of both training and testing datasets from their respective paths using pandas.\n\n2. **Encode Wave Direction**: The encode_wave_direction function converts the 'Dominant Wave Direction' categorical column into a numerical format using one-hot encoding. This is crucial for incorporating categorical data into our model.\n\n3. **Feature Normalization**: The preprocess_features function normalizes continuous variables (excluding 'x' and 'y'), ensuring that each feature contributes proportionately to the distance and directional calculations.\n\n4. **Build Neural Network Model**: The build_deep_learning_model function constructs a PyTorch neural network suitable for regression problems.\n\n5. **Training Process**: The train_model function iterates over the dataset multiple times (epochs), adjusting weights to minimize the loss function.\n\n6. **Evaluation**: The evaluate_model function computes the final mean squared error on the testing dataset, which gauges model performance.\n\nThe deep learning model integrates elements of the Bruun and Dean models through feature preprocessing, taking into account both historical approaches to model predictive innovation statistically and computationally.\n\nThe execution of the main function in this script is self-contained and will sequentially follow the above steps when called.",
                "main_function_name": "main",
                "score": 0.1237056723661825,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.554,
                "radon_score": 0.683056723661825,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 117, in main\n  File \"<string>\", line 74, in evaluate_model\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\container.py\", line 217, in forward\n    input = module(input)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\linear.py\", line 116, in forward\n    return F.linear(input, self.weight, self.bias)\nRuntimeError: mat1 and mat2 shapes cannot be multiplied (32x27 and 28x64)\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.007100591715976331
                }
            }
        },
        "1": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nfrom torch.utils.data import DataLoader, TensorDataset\nfrom sklearn.preprocessing import OneHotEncoder, StandardScaler\nimport numpy as np\n\n# Load the data from Excel files\ndef load_data(train_path, test_path):\n    train_data = pd.read_excel(train_path)\n    test_data = pd.read_excel(test_path)\n    return train_data, test_data\n\n# One-hot encode the 'Dominant Wave Direction' feature\ndef encode_wave_direction(dataframe):\n    encoder = OneHotEncoder(sparse_output=False)\n    wave_direction_encoded = encoder.fit_transform(dataframe[['Dominant Wave Direction']])\n    wave_direction_df = pd.DataFrame(wave_direction_encoded, columns=encoder.get_feature_names_out(['Dominant Wave Direction']))\n    dataframe = dataframe.drop('Dominant Wave Direction', axis=1)\n    dataframe = pd.concat([dataframe, wave_direction_df], axis=1)\n    return dataframe\n\n# Normalize continuous features\ndef preprocess_features(dataframe):\n    # Calculate features to normalize, excluding 'x' and 'y'\n    features_to_normalize = dataframe.drop(['x', 'y'], axis=1).select_dtypes(include=[np.number]).columns\n    scaler = StandardScaler()\n    dataframe[features_to_normalize] = scaler.fit_transform(dataframe[features_to_normalize])\n    return dataframe\n\n# Compute the shoreline retreat using the Bruun rule\ndef compute_bruun_retreat(R, B, h):\n    return (R * B) / (h + B)\n\n# Compute the water depth using the Dean model\ndef compute_dean_depth(A, x):\n    return A * (x ** (2/3))\n\n# Build and compile a PyTorch deep learning model\ndef build_deep_learning_model(input_dim):\n    model = nn.Sequential(\n        nn.Linear(input_dim, 64),\n        nn.ReLU(),\n        nn.Linear(64, 32),\n        nn.ReLU(),\n        nn.Linear(32, 1)  # Output layer for regression\n    )\n    return model\n\n# Train the PyTorch model\ndef train_model(model, train_loader, epochs):\n    criterion = nn.MSELoss()\n    optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n    model.train()\n    \n    for epoch in range(epochs):\n        for inputs, targets in train_loader:\n            optimizer.zero_grad()\n            outputs = model(inputs)\n            loss = criterion(outputs, targets)\n            loss.backward()\n            optimizer.step()\n    \n    return model\n\n# Evaluate the trained model\ndef evaluate_model(model, test_loader):\n    model.eval()\n    total_loss = 0\n    criterion = nn.MSELoss()\n    \n    with torch.no_grad():\n        for inputs, targets in test_loader:\n            outputs = model(inputs)\n            loss = criterion(outputs, targets)\n            total_loss += loss.item()\n    \n    # Calculate mean loss\n    mean_loss = total_loss / len(test_loader)\n    return {\"Mean Square Error\": mean_loss}\n\n# Main function to integrate all components\ndef main():\n    # Load data\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n    \n    train_data, test_data = load_data(train_path, test_path)\n    \n    # Preprocessing\n    train_data = encode_wave_direction(train_data)\n    test_data = encode_wave_direction(test_data)\n    \n    train_data = preprocess_features(train_data)\n    test_data = preprocess_features(test_data)\n    \n    # Prepare data for deep learning\n    X_train = torch.tensor(train_data.drop('y', axis=1).values, dtype=torch.float32)\n    y_train = torch.tensor(train_data['y'].values, dtype=torch.float32).view(-1, 1)\n    train_dataset = TensorDataset(X_train, y_train)\n    train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)\n    \n    X_test = torch.tensor(test_data.drop('y', axis=1).values, dtype=torch.float32)\n    y_test = torch.tensor(test_data['y'].values, dtype=torch.float32).view(-1, 1)\n    test_dataset = TensorDataset(X_test, y_test)\n    test_loader = DataLoader(test_dataset, batch_size=32, shuffle=False)\n    \n    # Build model\n    input_dim = X_train.shape[1]  # Correct input dimension after preprocessing\n    model = build_deep_learning_model(input_dim)\n\n    # Train model\n    epochs = 100\n    trained_model = train_model(model, train_loader, epochs)\n    \n    # Evaluate model\n    evaluation_metrics = evaluate_model(trained_model, test_loader)\n    \n    return evaluation_metrics",
                "plan": "1. **Data Loading**: Use `pandas` to load training and test data from Excel files.\n2. **Encoding**: Convert the 'Dominant Wave Direction' categorical column to a numerical format using one-hot encoding to make it suitable for machine learning models.\n3. **Normalization**: Standardize all numerical features except 'x' and 'y' using `StandardScaler` to improve model performance.\n4. **Mathematical Model Exploration**:\n   - Implement computation based on the Bruun rule and the Dean model formulas, although not directly used in model training here; these equations provide insight into coastal dynamics.\n5. **Deep Learning Model Building**:\n   - Define a simple feedforward neural network with input dimensions matching the preprocessed feature set to avoid shape mismatches.\n6. **Training**: Use an Adam optimizer to train the model, applying an MSE loss function over a prescribed number of epochs.\n7. **Evaluation**: Validate the model on test data and return metrics like mean squared error to assess performance.\n8. **Integration**: Compose everything within a `main()` function for easy execution and integration of the entire preprocessing and modeling pipeline.",
                "main_function_name": "main",
                "score": 0.12413357841782123,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.554,
                "radon_score": 0.6873357841782122,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 117, in main\n  File \"<string>\", line 74, in evaluate_model\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\container.py\", line 217, in forward\n    input = module(input)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\linear.py\", line 116, in forward\n    return F.linear(input, self.weight, self.bias)\nRuntimeError: mat1 and mat2 shapes cannot be multiplied (32x27 and 28x64)\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.00109239872553482
                }
            }
        },
        "2": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nfrom torch.utils.data import DataLoader, TensorDataset\nfrom sklearn.preprocessing import OneHotEncoder, StandardScaler\nimport numpy as np\n\ndef load_data(train_path, test_path):\n    train_data = pd.read_excel(train_path)\n    test_data = pd.read_excel(test_path)\n    return train_data, test_data\n\ndef encode_wave_direction(dataframe, encoder=None):\n    if encoder is None:\n        encoder = OneHotEncoder(sparse_output=False)\n        wave_direction_encoded = encoder.fit_transform(dataframe[['Dominant Wave Direction']])\n    else:\n        wave_direction_encoded = encoder.transform(dataframe[['Dominant Wave Direction']])\n    \n    wave_direction_df = pd.DataFrame(wave_direction_encoded, columns=encoder.get_feature_names_out(['Dominant Wave Direction']))\n    dataframe = dataframe.drop('Dominant Wave Direction', axis=1)\n    dataframe = pd.concat([dataframe, wave_direction_df], axis=1)\n    \n    return dataframe, encoder\n\ndef preprocess_features(dataframe, scaler=None):\n    features_to_normalize = dataframe.drop(['x', 'y'], axis=1, errors='ignore').select_dtypes(include=[np.number]).columns\n    \n    if scaler is None:\n        scaler = StandardScaler()\n        dataframe[features_to_normalize] = scaler.fit_transform(dataframe[features_to_normalize])\n    else:\n        dataframe[features_to_normalize] = scaler.transform(dataframe[features_to_normalize])\n    \n    return dataframe, scaler\n\ndef compute_bruun_retreat(R, B, h):\n    return (R * B) / (h + B)\n\ndef compute_dean_depth(A, x):\n    return A * (x ** (2/3))\n\ndef build_deep_learning_model(input_dim):\n    model = nn.Sequential(\n        nn.Linear(input_dim, 64),\n        nn.ReLU(),\n        nn.Linear(64, 32),\n        nn.ReLU(),\n        nn.Linear(32, 1)  # Output layer for regression\n    )\n    return model\n\ndef train_model(model, train_loader, epochs):\n    criterion = nn.MSELoss()\n    optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n    model.train()\n    \n    for epoch in range(epochs):\n        for inputs, targets in train_loader:\n            optimizer.zero_grad()\n            outputs = model(inputs)\n            loss = criterion(outputs, targets)\n            loss.backward()\n            optimizer.step()\n    \n    return model\n\ndef evaluate_model(model, test_loader):\n    model.eval()\n    total_loss = 0\n    criterion = nn.MSELoss()\n    \n    with torch.no_grad():\n        for inputs, targets in test_loader:\n            outputs = model(inputs)\n            loss = criterion(outputs, targets)\n            total_loss += loss.item()\n    \n    mean_loss = total_loss / len(test_loader)\n    return {\"Mean Square Error\": mean_loss}\n\ndef main():\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n    \n    train_data, test_data = load_data(train_path, test_path)\n    \n    train_data, encoder = encode_wave_direction(train_data)\n    test_data, _ = encode_wave_direction(test_data, encoder=encoder)\n    \n    train_data, scaler = preprocess_features(train_data)\n    test_data, _ = preprocess_features(test_data, scaler=scaler)\n    \n    X_train = torch.tensor(train_data.drop('y', axis=1).values, dtype=torch.float32)\n    y_train = torch.tensor(train_data['y'].values, dtype=torch.float32).view(-1, 1)\n    train_dataset = TensorDataset(X_train, y_train)\n    train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)\n    \n    X_test = torch.tensor(test_data.drop('y', axis=1).values, dtype=torch.float32)\n    y_test = torch.tensor(test_data['y'].values, dtype=torch.float32).view(-1, 1)\n    test_dataset = TensorDataset(X_test, y_test)\n    test_loader = DataLoader(test_dataset, batch_size=32, shuffle=False)\n    \n    input_dim = X_train.shape[1]\n    model = build_deep_learning_model(input_dim)\n    \n    epochs = 100\n    trained_model = train_model(model, train_loader, epochs)\n    \n    evaluation_metrics = evaluate_model(trained_model, test_loader)\n    \n    return evaluation_metrics",
                "plan": "1. **Data Loading**: The main function begins by loading the train and test datasets using `load_data()`.\n\n2. **Preprocessing**: \n   - The categorical 'Dominant Wave Direction' column is one-hot encoded using `encode_wave_direction()`.\n   - Numerical features are normalized using `preprocess_features()`.\n   - Ensures both the encoder and scaler are applied consistently across training and test sets to prevent dimension mismatch errors.\n\n3. **Model Configuration**:\n   - Defines and composes a sequential PyTorch model tailored for regression in `build_deep_learning_model()`.\n\n4. **Training Process**:\n   - Optimizes the model through gradient descent using the Adam optimizer by examining mean squared error loss during training with `train_model()`.\n\n5. **Evaluation**:\n   - It evaluates the trained model on test data by predicting and computing mean squared error in `evaluate_model()`.\n\n6. **Execution**: \n   - It integrates all the above functions into a main function named `main()`, loading, preprocessing, training, and finally evaluating the model.",
                "main_function_name": "main",
                "score": 0.7999474777671158,
                "pass_rate": 1.0,
                "pass_rate_score": 1.0,
                "prediction_score": 0.0,
                "pylint_score": 0.513,
                "radon_score": 0.4864747776711589,
                "test_case_results": {
                    "runnability_check": {
                        "success": true,
                        "reason": null,
                        "message": "code is runnable"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.00109239872553482
                }
            }
        }
    },
    {
        "0": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nfrom torch import nn\nfrom torch.utils.data import DataLoader, TensorDataset\nfrom sklearn.model_selection import train_test_split\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nimport numpy as np\n\ndef load_data(train_file: str, test_file: str):\n    # Load the Excel files into Pandas DataFrames\n    train_data = pd.read_excel(train_file)\n    test_data = pd.read_excel(test_file)\n    \n    # Identify and fill any missing values\n    train_data.fillna(method='ffill', inplace=True)\n    test_data.fillna(method='ffill', inplace=True)\n    \n    # One-hot encode the 'Dominant Wave Direction'\n    encoder = OneHotEncoder(sparse=False)\n    direction_encoded_train = encoder.fit_transform(train_data[['Dominant Wave Direction']])\n    direction_encoded_test = encoder.transform(test_data[['Dominant Wave Direction']])\n    \n    columns_encoded = encoder.get_feature_names_out(['Dominant Wave Direction'])\n    train_data_encoded = pd.concat([train_data, pd.DataFrame(direction_encoded_train, columns=columns_encoded)], axis=1)\n    test_data_encoded = pd.concat([test_data, pd.DataFrame(direction_encoded_test, columns=columns_encoded)], axis=1)\n    \n    # Normalize numerical features\n    numerical_features = ['x', 'Breaker Wave Height Hb', 'Deep Water Wave Height Hd', 'Annual Mean Period']\n    scaler = StandardScaler()\n    train_data_encoded[numerical_features] = scaler.fit_transform(train_data_encoded[numerical_features])\n    test_data_encoded[numerical_features] = scaler.transform(test_data_encoded[numerical_features])\n    \n    return train_data_encoded, test_data_encoded\n\ndef bruun_model(S: float, L: float, B: float, h: float) -> float:\n    # Use the Bruun Rule formula to compute the horizontal shift of the shoreline.\n    delta_X = (S * L) / (B + h)\n    return delta_X\n\ndef dean_model(y: float, A: float) -> float:\n    # Use the Dean model formula to compute the water depth at given distance.\n    h_y = A * (y ** (2 / 3))\n    return h_y\n\ndef build_model(train_data: pd.DataFrame, test_data: pd.DataFrame) -> nn.Module:\n    # Define target and features\n    feature_columns = ['x', 'Breaker Wave Height Hb', 'Deep Water Wave Height Hd', \n                       'Annual Mean Period'] + \\\n                      list(train_data.filter(regex='Dominant Wave Direction_').columns)\n    X_train = train_data[feature_columns].values\n    y_train = train_data['y'].values\n\n    X_test = test_data[feature_columns].values\n    y_test = test_data['y'].values\n    \n    # Convert to tensors\n    X_train_tensor = torch.tensor(X_train, dtype=torch.float32)\n    y_train_tensor = torch.tensor(y_train, dtype=torch.float32).view(-1, 1)\n    X_test_tensor = torch.tensor(X_test, dtype=torch.float32)\n    y_test_tensor = torch.tensor(y_test, dtype=torch.float32).view(-1, 1)\n    \n    # Define a simple fully connected neural network model\n    class BeachProfileModel(nn.Module):\n        def __init__(self, input_dim):\n            super(BeachProfileModel, self).__init__()\n            self.fc1 = nn.Linear(input_dim, 64)\n            self.relu1 = nn.ReLU()\n            self.fc2 = nn.Linear(64, 32)\n            self.relu2 = nn.ReLU()\n            self.fc3 = nn.Linear(32, 1)\n        \n        def forward(self, x):\n            x = self.fc1(x)\n            x = self.relu1(x)\n            x = self.fc2(x)\n            x = self.relu2(x)\n            x = self.fc3(x)\n            return x\n\n    # Instantiate the model, define loss and optimizer\n    model = BeachProfileModel(input_dim=X_train.shape[1])\n    criterion = nn.MSELoss()\n    optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n    \n    # Create DataLoader for training\n    train_dataset = TensorDataset(X_train_tensor, y_train_tensor)\n    train_loader = DataLoader(train_dataset, batch_size=16, shuffle=True)\n    \n    # Train the model\n    model.train()\n    for epoch in range(100):  # example number of epochs\n        for X_batch, y_batch in train_loader:\n            optimizer.zero_grad()\n            predictions = model(X_batch)\n            loss = criterion(predictions, y_batch)\n            loss.backward()\n            optimizer.step()\n\n    return model\n\ndef main():\n    # Load and preprocess the data\n    train_data, test_data = load_data(\"beach_profile_data/processed_data/beachdata_train.xlsx\",\n                                      \"beach_profile_data/processed_data/beachdata_test.xlsx\")\n    \n    # Example usage of Bruun and Dean models\n    bruun_shift = bruun_model(S=0.5, L=1000, B=2, h=10)\n    dean_depth = dean_model(y=50, A=0.1)\n    \n    # Train the deep learning model\n    model = build_model(train_data, test_data)",
                "plan": "Step-by-step explanation:\n\n1. **Data Loading and Preprocessing**:\n   - The `load_data` function reads Excel files into Pandas DataFrames, handles missing values by forward filling, and encodes the categorical 'Dominant Wave Direction' using one-hot encoding.\n   - Numerical features relevant to geography and wave dynamics are standardized for improved model performance.\n\n2. **Implementation of Bruun and Dean Models**:\n   - `bruun_model` calculates the shore horizontal shift due to sea level rise using the inputs and the Bruun Rule formula.\n   - `dean_model` computes the water depth using the Dean model formula based on distance from shore and a defined sediment scale parameter.\n\n3. **Deep Learning Model**:\n   - In `build_model`, relevant features and target variables are extracted from datasets and converted into PyTorch tensors.\n   - A simple feedforward neural network (`BeachProfileModel`) is defined to capture complex relationships in the provided dataset. It includes two hidden layers activated by ReLU and an output layer, suitable for regression problems.\n   - The data is loaded using `DataLoader`, and the model is trained with mean square error loss function and Adam optimizer, going over 100 epochs (as an example).\n\n4. **Main Function**:\n   - Calls all components to load and preprocess data, apply the Bruun and Dean models, and train the deep learning model using the functions defined.\n\nThis holistic approach integrates domain knowledge into predictive modeling, reflecting both conceptual models (Bruun and Dean) and detailed predictive models (neural networks). The models can be extended with more sophisticated architectures or features as needed in further testing and deployment phases.",
                "main_function_name": "main",
                "score": 0.8055071884703703,
                "pass_rate": 1.0,
                "pass_rate_score": 1.0,
                "prediction_score": 0.0,
                "pylint_score": 0.37,
                "radon_score": 0.685071884703703,
                "test_case_results": {
                    "runnability_check": {
                        "success": true,
                        "reason": null,
                        "message": "code is runnable"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.07692307692307693
                }
            }
        }
    },
    {
        "0": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nfrom sklearn.preprocessing import OneHotEncoder, StandardScaler\nfrom sklearn.model_selection import train_test_split\nimport keras\nfrom keras.models import Sequential\nfrom keras.layers import Dense\n\ndef beach_profile_model(train_file_path: str, test_file_path: str) -> dict:\n\n    # === Component: data_loader ===\n    def data_loader(train_path, test_path):\n        # Load the data from Excel files\n        train_data = pd.read_excel(train_path)\n        test_data = pd.read_excel(test_path)\n\n        # One-hot encode 'Dominant Wave Direction'\n        encoder = OneHotEncoder()\n        train_encoded = encoder.fit_transform(train_data[['Dominant Wave Direction']]).toarray()\n        test_encoded = encoder.transform(test_data[['Dominant Wave Direction']]).toarray()\n\n        # Collect all numerical columns that need normalization\n        numeric_features = ['x', 'y', 'Breaker Wave Height Hb', 'Deep Water Wave Height Hd', \n                            'Annual Mean Period', 'Annual Mean Spring Tidal Range', \n                            'Annual Mean Tidal Range', 'High Tide Sediment Settling Velocity', \n                            'Intertidal Slope', 'Kurtosis', 'Latitude', 'Longitude',\n                            'Mean Grain Size', 'Mean Grain Size (Mz)', 'Mean Wave Height', \n                            'Period', 'Profile Azimuth', 'Profile Length', \n                            'Relative Tidal Range', 'Skewness', 'Sorting Coefficient']\n\n        # Normalize numerical features\n        scaler = StandardScaler()\n        train_data[numeric_features] = scaler.fit_transform(train_data[numeric_features])\n        test_data[numeric_features] = scaler.transform(test_data[numeric_features])\n\n        # Combine normalized numerical features and encoded categorical features\n        train_processed_data = np.hstack((train_data[numeric_features].values, train_encoded))\n        test_processed_data = np.hstack((test_data[numeric_features].values, test_encoded))\n        \n        return train_processed_data, test_processed_data, train_data['y'].values, test_data['y'].values\n\n    # === Component: feature_engineer ===\n    def feature_engineer(data):\n        # Sample derived feature calculation: Energy = (Wave Height * Acceleration due to gravity * Wave Period)\n        # Simplified here for conceptual understanding\n        gravity = 9.81  # m/s^2\n        wave_energy = data[:, 2] * gravity * data[:, 14]  # Approximating using 'Breaker Wave Height Hb' and 'Period'\n        data = np.c_[data, wave_energy]  # Add new feature to the data\n        return data\n\n    # === Component: neural_network_model ===\n    def neural_network_model(input_shape):\n        model = Sequential()\n        model.add(Dense(64, input_dim=input_shape, activation='relu'))\n        model.add(Dense(32, activation='relu'))\n        model.add(Dense(1))  # Regression output layer\n        model.compile(optimizer='adam', loss='mean_squared_error')\n        return model\n\n    # === Component: train_and_evaluate_model ===\n    def train_and_evaluate_model(model, X_train, y_train, X_test, y_test):\n        # Split into training and validation for better generalization checking\n        X_tr, X_val, y_tr, y_val = train_test_split(X_train, y_train, test_size=0.2, random_state=42)\n\n        # Train the model\n        model.fit(X_tr, y_tr, epochs=100, batch_size=32, validation_data=(X_val, y_val), verbose=0)\n\n        # Evaluate the model\n        test_loss = model.evaluate(X_test, y_test, verbose=0)\n        return {'Test Loss': test_loss}\n\n    # Main process\n    # Load and preprocess the data\n    X_train, X_test, y_train, y_test = data_loader(train_file_path, test_file_path)\n\n    # Feature engineering\n    X_train = feature_engineer(X_train)\n    X_test = feature_engineer(X_test)\n\n    # Build the neural network model\n    model = neural_network_model(X_train.shape[1])\n\n    # Train and evaluate the model, returning evaluation results.\n    results = train_and_evaluate_model(model, X_train, y_train, X_test, y_test)\n\n    return results",
                "plan": "1. **Data Loading and Preprocessing**: Load training and test data from Excel files. One-hot encode the 'Dominant Wave Direction' column since it is categorical. Normalize numeric features using StandardScaler to stabilize the learning process.\n\n2. **Feature Engineering**: Create additional features based on existing ones. In this example, we derived a feature approximating wave energy which is added to the dataset.\n\n3. **Neural Network Model Definition**: A sequential neural network is defined with ReLU activation. It's designed to handle regression tasks, predicting sea level elevation.\n\n4. **Training and Evaluation**: Split the training data further into training and validation sets. Train the network and then evaluate it on the test set. The mean squared error of the test results is returned as an evaluation metric.\n\nEach component function corresponds to a logical section of the task, from loading data to model evaluation, which is tied together in the main function for execution.",
                "main_function_name": "beach_profile_model",
                "score": 0.12082436010328225,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.364,
                "radon_score": 0.8442436010328224,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "main_func_compile_error",
                        "message": "Compilation Error: Traceback (most recent call last):\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\tensorflow\\python\\pywrap_tensorflow.py\", line 73, in <module>\n    from tensorflow.python._pywrap_tensorflow_internal import *\nImportError: DLL load failed while importing _pywrap_tensorflow_internal: 动态链接库(DLL)初始化例程失败。\n\n\nFailed to load the native TensorFlow runtime.\nSee https://www.tensorflow.org/install/errors for some common causes and solutions.\nIf you need help, create an issue at https://github.com/tensorflow/tensorflow/issues and include the entire stack trace above this error message."
                    }
                },
                "test_weights": {
                    "runnability_check": 0.007100591715976331
                }
            }
        },
        "1": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nfrom sklearn.preprocessing import OneHotEncoder, StandardScaler\nfrom sklearn.model_selection import train_test_split\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\n\ndef beach_profile_model(train_file_path: str, test_file_path: str) -> dict:\n    # === Component: data_loader ===\n    def data_loader(train_path, test_path):\n        # Load the data from Excel files\n        train_data = pd.read_excel(train_path)\n        test_data = pd.read_excel(test_path)\n\n        # One-hot encode 'Dominant Wave Direction'\n        encoder = OneHotEncoder()\n        train_encoded = encoder.fit_transform(train_data[['Dominant Wave Direction']]).toarray()\n        test_encoded = encoder.transform(test_data[['Dominant Wave Direction']]).toarray()\n\n        # Collect all numerical columns that need normalization\n        numeric_features = ['x', 'Breaker Wave Height Hb', 'Deep Water Wave Height Hd', \n                            'Annual Mean Period', 'Annual Mean Spring Tidal Range', \n                            'Annual Mean Tidal Range', 'High Tide Sediment Settling Velocity', \n                            'Intertidal Slope', 'Kurtosis', 'Latitude', 'Longitude',\n                            'Mean Grain Size', 'Mean Grain Size (Mz)', 'Mean Wave Height', \n                            'Period', 'Profile Azimuth', 'Profile Length', \n                            'Relative Tidal Range', 'Skewness', 'Sorting Coefficient']\n\n        # Normalize numerical features\n        scaler = StandardScaler()\n        train_data[numeric_features] = scaler.fit_transform(train_data[numeric_features])\n        test_data[numeric_features] = scaler.transform(test_data[numeric_features])\n\n        # Combine normalized numerical features and encoded categorical features\n        train_processed_data = np.hstack((train_data[numeric_features].values, train_encoded))\n        test_processed_data = np.hstack((test_data[numeric_features].values, test_encoded))\n        \n        return train_processed_data, test_processed_data, train_data['y'].values, test_data['y'].values\n\n    # === Component: feature_engineer ===\n    def feature_engineer(data):\n        # Sample derived feature calculation: Energy = (Wave Height * Acceleration due to gravity * Wave Period)\n        # Simplified here for conceptual understanding\n        gravity = 9.81  # m/s^2\n        wave_energy = data[:, 2] * gravity * data[:, 14]  # Approximating using 'Breaker Wave Height Hb' and 'Period'\n        data = np.c_[data, wave_energy]  # Add new feature to the data\n        return data\n\n    # === Component: neural_network_model ===\n    class NeuralNetworkModel(nn.Module):\n        def __init__(self, input_shape):\n            super(NeuralNetworkModel, self).__init__()\n            self.layer1 = nn.Linear(input_shape, 64)\n            self.layer2 = nn.Linear(64, 32)\n            self.output_layer = nn.Linear(32, 1)\n\n        def forward(self, x):\n            x = torch.relu(self.layer1(x))\n            x = torch.relu(self.layer2(x))\n            x = self.output_layer(x)\n            return x\n\n    # === Component: train_and_evaluate_model ===\n    def train_and_evaluate_model(model, X_train, y_train, X_test, y_test, epochs=100):\n        # Convert data to PyTorch tensors\n        X_train_tensor = torch.tensor(X_train, dtype=torch.float32)\n        y_train_tensor = torch.tensor(y_train, dtype=torch.float32).view(-1, 1)\n        X_test_tensor = torch.tensor(X_test, dtype=torch.float32)\n        y_test_tensor = torch.tensor(y_test, dtype=torch.float32).view(-1, 1)\n\n        # Split into training and validation for better generalization checking\n        train_size = int(0.8 * len(X_train_tensor))\n        X_tr, X_val = torch.utils.data.random_split(X_train_tensor, [train_size, len(X_train_tensor) - train_size])\n        y_tr, y_val = torch.utils.data.random_split(y_train_tensor, [train_size, len(y_train_tensor) - train_size])\n\n        # Initialize the loss function and optimizer\n        criterion = nn.MSELoss()\n        optimizer = optim.Adam(model.parameters(), lr=0.001)\n\n        # Training loop\n        for epoch in range(epochs):\n            model.train()\n            optimizer.zero_grad()\n\n            # Forward pass\n            outputs = model(X_tr)\n            loss = criterion(outputs, y_tr)\n            loss.backward()\n            optimizer.step()\n\n            # Validation pass\n            model.eval()\n            val_outputs = model(X_val)\n            val_loss = criterion(val_outputs, y_val)\n\n            if epoch % 10 == 0:\n                print(f'Epoch {epoch}, Train Loss: {loss.item()}, Validation Loss: {val_loss.item()}')\n\n        # Evaluate the model on the test set\n        model.eval()\n        test_outputs = model(X_test_tensor)\n        test_loss = criterion(test_outputs, y_test_tensor)\n        return {'Test Loss': test_loss.item()}\n\n    # Main process\n    # Load and preprocess the data\n    X_train, X_test, y_train, y_test = data_loader(train_file_path, test_file_path)\n\n    # Feature engineering\n    X_train = feature_engineer(X_train)\n    X_test = feature_engineer(X_test)\n\n    # Build the neural network model\n    model = NeuralNetworkModel(X_train.shape[1])\n\n    # Train and evaluate the model, returning evaluation results.\n    results = train_and_evaluate_model(model, X_train, y_train, X_test, y_test)\n\n    return results",
                "plan": "1. **Data Loading**: The `data_loader` function reads in the data from Excel files and performs one-hot encoding on the 'Dominant Wave Direction' category. It also normalizes the specified numerical features for stability.\n   \n2. **Feature Engineering**: The `feature_engineer` function calculates derived features, such as wave energy, and appends these features to the dataset to enhance model performance.\n\n3. **Neural Network Model Construction**: A simple feedforward neural network is defined using PyTorch that consists of two hidden layers with ReLU activations. The 'NeuralNetworkModel' class handles creating the network.\n\n4. **Model Training and Evaluation**: The `train_and_evaluate_model` function trains the model using the training data and cross-validates on a separate validation set to avoid overfitting. The model's performance is evaluated on the test set, and the test loss is returned.\n   \n5. **Integration and Execution**: The main function integrates all components: loading data, feature engineering, model building, and model training. It ensures encapsulation of all steps for easy execution.",
                "main_function_name": "beach_profile_model",
                "score": 0.12925443004618803,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.5650000000000001,
                "radon_score": 0.7275443004618803,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\nTypeError: beach_profile_model() missing 2 required positional arguments: 'train_file_path' and 'test_file_path'\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.00109239872553482
                }
            }
        },
        "2": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nfrom sklearn.preprocessing import OneHotEncoder, StandardScaler\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\n\ndef beach_profile_model() -> dict:\n    # === Component: data_loader ===\n    def data_loader():\n        train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n        test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n        \n        # Load the data from Excel files\n        train_data = pd.read_excel(train_path)\n        test_data = pd.read_excel(test_path)\n\n        # One-hot encode 'Dominant Wave Direction'\n        encoder = OneHotEncoder(sparse=False)\n        train_encoded = encoder.fit_transform(train_data[['Dominant Wave Direction']])\n        test_encoded = encoder.transform(test_data[['Dominant Wave Direction']])\n\n        # Collect all numerical columns that need normalization\n        numeric_features = ['x', 'Breaker Wave Height Hb', 'Deep Water Wave Height Hd', \n                            'Annual Mean Period', 'Annual Mean Spring Tidal Range', \n                            'Annual Mean Tidal Range', 'High Tide Sediment Settling Velocity', \n                            'Intertidal Slope', 'Kurtosis', 'Latitude', 'Longitude',\n                            'Mean Grain Size', 'Mean Grain Size (Mz)', 'Mean Wave Height', \n                            'Period', 'Profile Azimuth', 'Profile Length', \n                            'Relative Tidal Range', 'Skewness', 'Sorting Coefficient']\n\n        # Normalize numerical features\n        scaler = StandardScaler()\n        train_data[numeric_features] = scaler.fit_transform(train_data[numeric_features])\n        test_data[numeric_features] = scaler.transform(test_data[numeric_features])\n\n        # Combine normalized numerical features and encoded categorical features\n        train_processed_data = np.hstack((train_data[numeric_features].values, train_encoded))\n        test_processed_data = np.hstack((test_data[numeric_features].values, test_encoded))\n        \n        return train_processed_data, test_processed_data, train_data['y'].values, test_data['y'].values\n\n    # === Component: feature_engineer ===\n    def feature_engineer(data):\n        # Sample derived feature calculation: Energy = (Wave Height * Acceleration due to gravity * Wave Period)\n        # Simplified here for conceptual understanding\n        gravity = 9.81  # m/s^2\n        wave_energy = data[:, 2] * gravity * data[:, 14]  # Approximating using 'Breaker Wave Height Hb' and 'Period'\n        data = np.c_[data, wave_energy]  # Add new feature to the data\n        return data\n\n    # === Component: neural_network_model ===\n    class NeuralNetworkModel(nn.Module):\n        def __init__(self, input_shape):\n            super(NeuralNetworkModel, self).__init__()\n            self.layer1 = nn.Linear(input_shape, 64)\n            self.layer2 = nn.Linear(64, 32)\n            self.output_layer = nn.Linear(32, 1)\n\n        def forward(self, x):\n            x = torch.relu(self.layer1(x))\n            x = torch.relu(self.layer2(x))\n            x = self.output_layer(x)\n            return x\n\n    # === Component: train_and_evaluate_model ===\n    def train_and_evaluate_model(model, X_train, y_train, X_test, y_test, epochs=100):\n        # Convert data to PyTorch tensors\n        X_train_tensor = torch.tensor(X_train, dtype=torch.float32)\n        y_train_tensor = torch.tensor(y_train, dtype=torch.float32).view(-1, 1)\n        X_test_tensor = torch.tensor(X_test, dtype=torch.float32)\n        y_test_tensor = torch.tensor(y_test, dtype=torch.float32).view(-1, 1)\n\n        # Split into training and validation for better generalization checking\n        train_size = int(0.8 * len(X_train_tensor))\n        train_data, val_data = torch.utils.data.random_split(\n            dataset=list(zip(X_train_tensor, y_train_tensor)), \n            lengths=[train_size, len(X_train_tensor) - train_size]\n        )\n\n        # Initialize the loss function and optimizer\n        criterion = nn.MSELoss()\n        optimizer = optim.Adam(model.parameters(), lr=0.001)\n\n        # Training loop\n        for epoch in range(epochs):\n            model.train()\n            for X_batch, y_batch in torch.utils.data.DataLoader(train_data, batch_size=32, shuffle=True):\n                optimizer.zero_grad()\n                outputs = model(X_batch)\n                loss = criterion(outputs, y_batch)\n                loss.backward()\n                optimizer.step()\n\n            # Validate model\n            model.eval()\n            val_loss = 0\n            with torch.no_grad():\n                for X_batch, y_batch in torch.utils.data.DataLoader(val_data, batch_size=32):\n                    val_outputs = model(X_batch)\n                    val_loss += criterion(val_outputs, y_batch).item()\n            val_loss /= len(val_data)\n            \n            if epoch % 10 == 0:\n                print(f'Epoch {epoch}, Validation Loss: {val_loss}')\n\n        # Evaluate the model on the test set\n        model.eval()\n        with torch.no_grad():\n            test_outputs = model(X_test_tensor)\n            test_loss = criterion(test_outputs, y_test_tensor)\n        \n        return {'Test Loss': test_loss.item()}\n\n    # MAIN PROCESS\n    # Load and preprocess the data\n    X_train, X_test, y_train, y_test = data_loader()\n\n    # Feature engineering\n    X_train = feature_engineer(X_train)\n    X_test = feature_engineer(X_test)\n\n    # Build the neural network model\n    model = NeuralNetworkModel(input_shape=X_train.shape[1])\n\n    # Train and evaluate the model, returning evaluation results.\n    results = train_and_evaluate_model(model, X_train, y_train, X_test, y_test)\n\n    return results",
                "plan": "1. **Data Loading:** Load the training and test datasets from specified file paths. Use the `pandas` library to read the Excel files.\n\n2. **Data Preprocessing:**\n   - Encode the categorical 'Dominant Wave Direction' column using OneHotEncoder for compatibility with the neural network.\n   - Normalize numerical features like wave height and tidal range using StandardScaler for improved model performance.\n\n3. **Feature Engineering:** \n   - Derive new features if needed, such as estimating wave energy using physical formulas (optional for advanced feature analysis).\n   \n4. **Neural Network Model:**\n   - Define a basic neural network with three layers using PyTorch, designed for regression tasks.\n   - Use ReLU activation functions in the hidden layers.\n\n5. **Training and Evaluation:**\n   - Train the model using MSE Loss and the Adam optimizer.\n   - Include a training/validation split and evaluate model performance on the validation and test datasets.\n   \n6. **Result Return:** The function returns a dictionary containing the test loss for performance evaluation.\n\nThis plan follows the instructions for a complete and cohesive approach to solving the task while integrating all components.",
                "main_function_name": "beach_profile_model",
                "score": 0.8277408865797029,
                "pass_rate": 1.0,
                "pass_rate_score": 1.0,
                "prediction_score": 0.0,
                "pylint_score": 0.5730000000000001,
                "radon_score": 0.7044088657970299,
                "test_case_results": {
                    "runnability_check": {
                        "success": true,
                        "reason": null,
                        "message": "code is runnable"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.00109239872553482
                }
            }
        }
    },
    {
        "0": {
            "code_0": {
                "code": "import pandas as pd\nfrom sklearn.model_selection import train_test_split\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nfrom sklearn.ensemble import RandomForestRegressor\nfrom sklearn.metrics import mean_absolute_error, r2_score\nfrom sklearn.compose import ColumnTransformer\nfrom sklearn.pipeline import Pipeline\nfrom sklearn.impute import SimpleImputer\nfrom sklearn.compose import make_column_selector as selector\n\ndef load_data(train_path: str, test_path: str):\n    \"\"\"\n    Loads the training and testing data from the specified Excel files.\n\n    Parameters:\n    - train_path: Path to the training data file.\n    - test_path: Path to the testing data file.\n\n    Returns:\n    - Two DataFrames for training and testing data respectively.\n    \"\"\"\n    train_df = pd.read_excel(train_path)\n    test_df = pd.read_excel(test_path)\n    return train_df, test_df\n\ndef preprocess_data(df: pd.DataFrame):\n    \"\"\"\n    Preprocess the data by encoding categorical features and scaling numerical features.\n\n    Parameters:\n    - df: DataFrame containing the data to preprocess.\n\n    Returns:\n    - Processed DataFrame with features ready for modeling.\n    - StandardScaler object used to scale numerical data.\n    \"\"\"\n    # Separate features and target variable 'y'\n    y = df['y']\n    X = df.drop('y', axis=1)\n\n    # Define transformations\n    # Categorical features transformation\n    categorical_transformer = Pipeline(steps=[\n        ('imputer', SimpleImputer(strategy='constant', fill_value='missing')),\n        ('onehot', OneHotEncoder(handle_unknown='ignore'))\n    ])\n    \n    # Numerical features transformation\n    numerical_transformer = Pipeline(steps=[\n        ('imputer', SimpleImputer(strategy='mean')),\n        ('scaler', StandardScaler())\n    ])\n    \n    # Combine transformations\n    preprocessor = ColumnTransformer(\n        transformers=[\n            ('num', numerical_transformer, selector(dtype_exclude=\"object\")),\n            ('cat', categorical_transformer, selector(dtype_include=\"object\"))\n        ])\n    \n    # Fit transform the data\n    X_processed = preprocessor.fit_transform(X)\n    \n    return X_processed, y, preprocessor\n\ndef bruun_model_prediction(L: float, h: float, B: float, delta_S: float):\n    \"\"\"\n    Returns the predicted shoreline retreat using the Bruun model.\n\n    Parameters:\n    - L: Active profile length.\n    - h: Depth of closure.\n    - B: Berm height.\n    - delta_S: Sea level rise.\n\n    Returns:\n    - Predicted shoreline retreat.\n    \"\"\"\n    return (L / (h + B)) * delta_S\n\ndef dean_model_prediction(x: float, A: float):\n    \"\"\"\n    Returns y(x) using the Dean model for beach profiles.\n\n    Parameters:\n    - x: Distance from origin.\n    - A: Fitting parameter.\n\n    Returns:\n    - Beach profile value, y(x).\n    \"\"\"\n    return A * x**(2/3)\n\ndef build_ml_model(X: pd.DataFrame, y: pd.Series):\n    \"\"\"\n    Builds and trains a machine learning regression model.\n\n    Parameters:\n    - X: DataFrame containing features.\n    - y: Series containing target variable.\n\n    Returns:\n    - Trained machine learning model.\n    \"\"\"\n    # Train the model\n    model = RandomForestRegressor(n_estimators=100, random_state=42)\n    model.fit(X, y)\n    return model\n\ndef evaluate_model(model, preprocessor, test_df: pd.DataFrame):\n    \"\"\"\n    Evaluates the trained model on the test dataset.\n\n    Parameters:\n    - model: Trained model.\n    - preprocessor: Preprocessor object for scaling.\n    - test_df: DataFrame containing the test data.\n\n    Returns:\n    - Dictionary containing evaluation metrics.\n    \"\"\"\n    X_test = test_df.drop('y', axis=1)\n    y_test = test_df['y']\n    X_test_processed = preprocessor.transform(X_test)\n    \n    # Predict and evaluate\n    predictions = model.predict(X_test_processed)\n    mae = mean_absolute_error(y_test, predictions)\n    r2 = r2_score(y_test, predictions)\n    \n    return {\"mae\": mae, \"r2\": r2}\n\ndef main():\n    # Load data\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n    train_df, test_df = load_data(train_path, test_path)\n\n    # Preprocess data\n    X_train_processed, y_train, preprocessor = preprocess_data(train_df)\n\n    # Build and train ML model\n    model = build_ml_model(X_train_processed, y_train)\n\n    # Evaluate the model\n    evaluation_results = evaluate_model(model, preprocessor, test_df)\n    print(\"Model evaluation results:\", evaluation_results)",
                "plan": "Here is a detailed step-by-step explanation of the code's workflow:\n\n1. **Data Loading (load_data)**:\n   - The code begins by loading training and testing data files using pandas' `read_excel` method. This yields two DataFrames: one for training and another for testing.\n\n2. **Preprocessing Data (preprocess_data)**:\n   - Separate the target variable 'y' from the features.\n   - Define preprocessing pipelines for numerical and categorical features:\n     - Categorical data is imputed and then encoded using OneHotEncoder.\n     - Numerical data is imputed for missing values using a mean strategy and then standardized.\n   - Use ColumnTransformer to apply these pipelines to the respective data types.\n   - Transform the data and return the processed features, target variable, and the preprocessor.\n\n3. **Mathematical Models**:\n   - **Bruun Model (bruun_model_prediction)**: Calculates shoreline retreat based on rise in sea level, active profile length, depth of closure, and berm height.\n   - **Dean Model (dean_model_prediction)**: Provides a beach profile representation based on a given distance and a fitting parameter.\n\n4. **Building the ML Model (build_ml_model)**:\n   - A RandomForestRegressor is initialized and trained on the processed training data to predict sea level impacts.\n\n5. **Evaluating the Model (evaluate_model)**:\n   - Test data is processed using the same pipeline as training data.\n   - The trained model predicts outcomes on the test set, and evaluation metrics like MAE and R^2 are computed.\n\n6. **Main Function (main)**:\n   - Coordinates loading, preprocessing, model training, and evaluation.\n   - Loads dataset paths, preprocesses the data, builds, and evaluates the model.\n\nThe entire process is encapsulated within a `main()` function, ensuring nothing is executed unless the function is explicitly called.",
                "main_function_name": "main",
                "score": 0.8283602652897541,
                "pass_rate": 1.0,
                "pass_rate_score": 1.0,
                "prediction_score": 0.0,
                "pylint_score": 0.5559999999999999,
                "radon_score": 0.727602652897542,
                "test_case_results": {
                    "runnability_check": {
                        "success": true,
                        "reason": null,
                        "message": "code is runnable"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.07692307692307693
                }
            }
        }
    },
    {
        "0": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nfrom sklearn.preprocessing import MinMaxScaler, StandardScaler\n\ndef read_data(train_path: str, test_path: str):\n    # Import the datasets from specified file paths\n    train_data = pd.read_excel(train_path)\n    test_data = pd.read_excel(test_path)\n    return train_data, test_data\n\ndef encode_categorical_features(df: pd.DataFrame):\n    # Encode categorical 'Dominant Wave Direction' using one-hot encoding\n    if 'Dominant Wave Direction' in df.columns:\n        df = pd.get_dummies(df, columns=['Dominant Wave Direction'], drop_first=True)\n    return df\n\ndef preprocess_features(df: pd.DataFrame):\n    # Identify columns for normalization and standardization\n    features_to_normalize = ['Annual Mean Period', 'Annual Mean Tidal Range', \n                             'Annual Mean Spring Tidal Range', 'Breaker Wave Height Hb', \n                             'Deep Water Wave Height Hd', 'Intertidal Slope', \n                             'Mean Grain Size', 'Latitude', 'Longitude']\n    \n    # Initialize scalers\n    min_max_scaler = MinMaxScaler()\n    standard_scaler = StandardScaler()\n    \n    # Normalize the selected features\n    df[features_to_normalize] = min_max_scaler.fit_transform(df[features_to_normalize])\n    \n    # Return the updated DataFrame\n    return df\n\ndef build_model():\n    class SeaLevelPredictor(nn.Module):\n        def __init__(self, input_dim, hidden_dim=64):\n            super(SeaLevelPredictor, self).__init__()\n            # Simple network layout\n            self.layer1 = nn.Linear(input_dim, hidden_dim)\n            self.relu = nn.ReLU()\n            self.layer2 = nn.Linear(hidden_dim, hidden_dim)\n            self.output = nn.Linear(hidden_dim, 1)\n\n        def forward(self, x):\n            x = self.relu(self.layer1(x))\n            x = self.relu(self.layer2(x))\n            x = self.output(x)\n            return x\n    \n    # Assuming the number of input features\n    input_dim = 27  # This should be dynamically determined from training dataset\n    model = SeaLevelPredictor(input_dim)\n    return model\n\ndef train_model(model, train_data, target='y'):\n    # Split data into features and target\n    X_train = train_data.drop(columns=[target])\n    y_train = train_data[target]\n    \n    # Convert to PyTorch tensors\n    X_train_tensor = torch.tensor(X_train.values, dtype=torch.float32)\n    y_train_tensor = torch.tensor(y_train.values, dtype=torch.float32).view(-1, 1)\n    \n    # Define loss function and optimizer\n    criterion = nn.MSELoss()\n    optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n    \n    num_epochs = 1000  # Define number of epochs\n    for epoch in range(num_epochs):\n        # Forward pass\n        outputs = model(X_train_tensor)\n        loss = criterion(outputs, y_train_tensor)\n        \n        # Backward pass and optimization\n        optimizer.zero_grad()\n        loss.backward()\n        optimizer.step()\n    \n    return None\n\ndef evaluate_model(model, test_data, target='y'):\n    # Split the test data into features and targets\n    X_test = test_data.drop(columns=[target])\n    y_test = test_data[target]\n    \n    # Convert to PyTorch tensors\n    X_test_tensor = torch.tensor(X_test.values, dtype=torch.float32)\n    y_test_tensor = torch.tensor(y_test.values, dtype=torch.float32).view(-1, 1)\n    \n    # Evaluate the model\n    model.eval()\n    with torch.no_grad():\n        predictions = model(X_test_tensor)\n        \n    # Calculate and return evaluation metrics\n    mse = nn.MSELoss()(predictions, y_test_tensor).item()\n    rmse = mse ** 0.5\n    return {\"RMSE\": rmse}\n\ndef main():\n    # Data paths\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n\n    # Read datasets\n    train_data, test_data = read_data(train_path, test_path)\n\n    # Encode categorical features\n    train_data = encode_categorical_features(train_data)\n    test_data = encode_categorical_features(test_data)\n\n    # Preprocess features\n    train_data = preprocess_features(train_data)\n    test_data = preprocess_features(test_data)\n\n    # Build model\n    model = build_model()\n\n    # Train model with the processed training data\n    train_model(model, train_data)\n\n    # Evaluate the model with the processed test data\n    evaluation_metrics = evaluate_model(model, test_data)\n\n    return evaluation_metrics",
                "plan": "1. **read_data**: Loads the datasets from the specified paths using pandas and returns them as DataFrames for further processing.\n2. **encode_categorical_features**: Uses pandas' get_dummies function to one-hot encode the 'Dominant Wave Direction' categorical column to make it suitable for model input.\n3. **preprocess_features**: Applies MinMaxScaler to normalize the features that are crucial in the model, ensuring all numerical inputs are on a consistent scale for the neural network.\n4. **build_model**: Defines a simple three-layer neural network using PyTorch, structured to predict elevation ('y'). This uses fully connected layers and ReLU activation functions.\n5. **train_model**: Trains the model using a specified optimizer and loss function over defined epochs, adjusting weights through backpropagation.\n6. **evaluate_model**: Evaluates the trained model on the test dataset to compute RMSE as a metric of prediction error.\n7. **main**: Orchestrates the entire process, from reading and preprocessing data to building, training, and evaluating the model. Returns the evaluation metrics as the output.",
                "main_function_name": "main",
                "score": 0.1300987832521572,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.542,
                "radon_score": 0.758987832521572,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 121, in main\n  File \"<string>\", line 62, in train_model\nTypeError: can't convert np.ndarray of type numpy.object_. The only supported types are: float64, float32, float16, complex64, complex128, int64, int32, int16, int8, uint64, uint32, uint16, uint8, and bool.\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.007100591715976331
                }
            }
        },
        "1": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nfrom sklearn.preprocessing import MinMaxScaler, StandardScaler\n\ndef read_data(train_path: str, test_path: str):\n    # Import the datasets from specified file paths\n    train_data = pd.read_excel(train_path)\n    test_data = pd.read_excel(test_path)\n    return train_data, test_data\n\ndef encode_categorical_features(df: pd.DataFrame):\n    # Encode categorical 'Dominant Wave Direction' using one-hot encoding\n    if 'Dominant Wave Direction' in df.columns:\n        df = pd.get_dummies(df, columns=['Dominant Wave Direction'], drop_first=True)\n    return df\n\ndef preprocess_features(df: pd.DataFrame):\n    # Identify columns for normalization and standardization\n    features_to_normalize = ['Annual Mean Period', 'Annual Mean Tidal Range', \n                             'Annual Mean Spring Tidal Range', 'Breaker Wave Height Hb', \n                             'Deep Water Wave Height Hd', 'Intertidal Slope', \n                             'Mean Grain Size', 'Latitude', 'Longitude']\n    \n    # Filling NaNs with mean values for each column\n    df.fillna(df.mean(), inplace=True)\n    \n    # Initialize scalers\n    min_max_scaler = MinMaxScaler()\n    \n    # Normalize the selected features\n    df[features_to_normalize] = min_max_scaler.fit_transform(df[features_to_normalize])\n    \n    return df\n\ndef build_model(input_dim):\n    class SeaLevelPredictor(nn.Module):\n        def __init__(self, input_dim, hidden_dim=64):\n            super(SeaLevelPredictor, self).__init__()\n            self.layer1 = nn.Linear(input_dim, hidden_dim)\n            self.relu = nn.ReLU()\n            self.layer2 = nn.Linear(hidden_dim, hidden_dim)\n            self.output = nn.Linear(hidden_dim, 1)\n\n        def forward(self, x):\n            x = self.relu(self.layer1(x))\n            x = self.relu(self.layer2(x))\n            x = self.output(x)\n            return x\n    \n    model = SeaLevelPredictor(input_dim)\n    return model\n\ndef train_model(model, train_data, target='y'):\n    # Split data into features and target\n    X_train = train_data.drop(columns=[target])\n    y_train = train_data[target]\n    \n    # Convert to PyTorch tensors\n    X_train_tensor = torch.tensor(X_train.values, dtype=torch.float32)\n    y_train_tensor = torch.tensor(y_train.values, dtype=torch.float32).view(-1, 1)\n    \n    # Define loss function and optimizer\n    criterion = nn.MSELoss()\n    optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n    \n    num_epochs = 1000\n    for epoch in range(num_epochs):\n        model.train()\n        # Forward pass\n        outputs = model(X_train_tensor)\n        loss = criterion(outputs, y_train_tensor)\n        \n        # Backward pass and optimization\n        optimizer.zero_grad()\n        loss.backward()\n        optimizer.step()\n    \n    return None\n\ndef evaluate_model(model, test_data, target='y'):\n    # Split the test data into features and targets\n    X_test = test_data.drop(columns=[target])\n    y_test = test_data[target]\n    \n    # Convert to PyTorch tensors\n    X_test_tensor = torch.tensor(X_test.values, dtype=torch.float32)\n    y_test_tensor = torch.tensor(y_test.values, dtype=torch.float32).view(-1, 1)\n    \n    # Evaluate the model\n    model.eval()\n    with torch.no_grad():\n        predictions = model(X_test_tensor)\n        \n    # Calculate and return evaluation metrics\n    mse = nn.MSELoss()(predictions, y_test_tensor).item()\n    rmse = mse ** 0.5\n    return {\"RMSE\": rmse}\n\ndef main():\n    # Data paths\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n\n    # Read datasets\n    train_data, test_data = read_data(train_path, test_path)\n\n    # Encode categorical features\n    train_data = encode_categorical_features(train_data)\n    test_data = encode_categorical_features(test_data)\n\n    # Preprocess features\n    train_data = preprocess_features(train_data)\n    test_data = preprocess_features(test_data)\n\n    # Build model\n    input_dim = train_data.drop(columns=['y']).shape[1]\n    model = build_model(input_dim)\n\n    # Train model with the processed training data\n    train_model(model, train_data)\n\n    # Evaluate the model with the processed test data\n    evaluation_metrics = evaluate_model(model, test_data)\n\n    return evaluation_metrics",
                "plan": "1. **Read Data**: Use `pandas` to read training and testing data from specified Excel files.\n2. **Encode Features**: Perform one-hot encoding on the 'Dominant Wave Direction' column to convert categorical data to numerical.\n3. **Preprocess Features**: Fill NaN values with the columns' mean, normalize specified features using `MinMaxScaler`, ensuring the data is in a suitable format for model input.\n4. **Build Model**: Define a neural network using PyTorch, tailored to the number of input features.\n5. **Train Model**: Train the neural network using the processed training data, employing MSE as the loss function and the Adam optimizer.\n6. **Evaluate Model**: Evaluate the model using RMSE on the test data after converting data to appropriate tensor format.\n7. **Main Function**: Organize the process flow with `main`, allowing the calling of all steps sequentially.",
                "main_function_name": "main",
                "score": 0.12796335651887625,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.534,
                "radon_score": 0.7456335651887624,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 121, in main\n  File \"<string>\", line 60, in train_model\nTypeError: can't convert np.ndarray of type numpy.object_. The only supported types are: float64, float32, float16, complex64, complex128, int64, int32, int16, int8, uint64, uint32, uint16, uint8, and bool.\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        },
        "2": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nfrom sklearn.preprocessing import MinMaxScaler\nimport numpy as np\n\ndef read_data(train_path: str, test_path: str):\n    # Import the datasets from specified file paths\n    train_data = pd.read_excel(train_path)\n    test_data = pd.read_excel(test_path)\n    return train_data, test_data\n\ndef encode_categorical_features(df: pd.DataFrame):\n    # Encode categorical 'Dominant Wave Direction' using one-hot encoding\n    if 'Dominant Wave Direction' in df.columns:\n        df = pd.get_dummies(df, columns=['Dominant Wave Direction'], drop_first=True)\n    return df\n\ndef preprocess_features(df: pd.DataFrame):\n    # Identify columns for normalization\n    features_to_normalize = ['Annual Mean Period', 'Annual Mean Tidal Range', \n                             'Annual Mean Spring Tidal Range', 'Breaker Wave Height Hb', \n                             'Deep Water Wave Height Hd', 'Intertidal Slope', \n                             'Mean Grain Size', 'Latitude', 'Longitude']\n    \n    # Filling NaNs with mean values for each column\n    df.fillna(df.mean(numeric_only=True), inplace=True)\n    \n    # Initialize MinMaxScaler\n    min_max_scaler = MinMaxScaler()\n    \n    # Normalize the selected features\n    df[features_to_normalize] = min_max_scaler.fit_transform(df[features_to_normalize])\n    \n    # Convert all columns to float to avoid type errors\n    df = df.astype(np.float32)\n    \n    return df\n\ndef build_model(input_dim):\n    class SeaLevelPredictor(nn.Module):\n        def __init__(self, input_dim, hidden_dim=64):\n            super(SeaLevelPredictor, self).__init__()\n            self.layer1 = nn.Linear(input_dim, hidden_dim)\n            self.relu = nn.ReLU()\n            self.layer2 = nn.Linear(hidden_dim, hidden_dim)\n            self.output = nn.Linear(hidden_dim, 1)\n\n        def forward(self, x):\n            x = self.relu(self.layer1(x))\n            x = self.relu(self.layer2(x))\n            x = self.output(x)\n            return x\n    \n    model = SeaLevelPredictor(input_dim)\n    return model\n\ndef train_model(model, train_data, target='y'):\n    # Split data into features and target\n    X_train = train_data.drop(columns=[target])\n    y_train = train_data[target]\n    \n    # Convert to PyTorch tensors\n    X_train_tensor = torch.tensor(X_train.values, dtype=torch.float32)\n    y_train_tensor = torch.tensor(y_train.values, dtype=torch.float32).view(-1, 1)\n    \n    # Define loss function and optimizer\n    criterion = nn.MSELoss()\n    optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n    \n    num_epochs = 1000\n    for epoch in range(num_epochs):\n        model.train()\n        # Forward pass\n        outputs = model(X_train_tensor)\n        loss = criterion(outputs, y_train_tensor)\n        \n        # Backward pass and optimization\n        optimizer.zero_grad()\n        loss.backward()\n        optimizer.step()\n    \n    return None\n\ndef evaluate_model(model, test_data, target='y'):\n    # Split the test data into features and targets\n    X_test = test_data.drop(columns=[target])\n    y_test = test_data[target]\n    \n    # Convert to PyTorch tensors\n    X_test_tensor = torch.tensor(X_test.values, dtype=torch.float32)\n    y_test_tensor = torch.tensor(y_test.values, dtype=torch.float32).view(-1, 1)\n    \n    # Evaluate the model\n    model.eval()\n    with torch.no_grad():\n        predictions = model(X_test_tensor)\n        \n    # Calculate and return evaluation metrics\n    mse = nn.MSELoss()(predictions, y_test_tensor).item()\n    rmse = mse ** 0.5\n    return {\"RMSE\": rmse}\n\ndef main():\n    # Data paths\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n\n    # Read datasets\n    train_data, test_data = read_data(train_path, test_path)\n\n    # Encode categorical features\n    train_data = encode_categorical_features(train_data)\n    test_data = encode_categorical_features(test_data)\n\n    # Preprocess features\n    train_data = preprocess_features(train_data)\n    test_data = preprocess_features(test_data)\n\n    # Build model\n    input_dim = train_data.drop(columns=['y']).shape[1]\n    model = build_model(input_dim)\n\n    # Train model with the processed training data\n    train_model(model, train_data)\n\n    # Evaluate the model with the processed test data\n    evaluation_metrics = evaluate_model(model, test_data)\n\n    return evaluation_metrics",
                "plan": "1. **Data Reading**: The script begins by reading train and test datasets from Excel files using `pandas.read_excel`.\n\n2. **Encoding Categorical Features**: The Dominant Wave Direction is encoded using one-hot encoding for numerical representation.\n\n3. **Data Preprocessing**:\n   - Identify features that require normalization.\n   - Fill missing values with column means using `fillna`.\n   - Normalize the selected features using `MinMaxScaler`.\n   - Convert the entire DataFrame to `float32` to ensure compatibility with PyTorch.\n\n4. **Model Building**: Define a simple feedforward neural network for predicting sea level elevations using `torch.nn`.\n\n5. **Model Training**: The model is trained using the training dataset converted to PyTorch tensors. The model performs forward and backward passes with the Adam optimizer for a specified number of epochs.\n\n6. **Model Evaluation**: The trained model is evaluated on the test dataset, calculating the RMSE as a metric to output the model's performance.\n\n7. **Main Function Execution**: The `main` function orchestrates the data loading, preprocessing, model creation, training, and evaluation processes.\n\n8. **Return Evaluation Metrics**: The final evaluation metrics (RMSE) are returned from the `main` function for further analysis or reporting.",
                "main_function_name": "main",
                "score": 0.1291425164889684,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.5469999999999999,
                "radon_score": 0.7444251648896842,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 128, in main\n  File \"<string>\", line 97, in evaluate_model\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"<string>\", line 50, in forward\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\linear.py\", line 116, in forward\n    return F.linear(input, self.weight, self.bias)\nRuntimeError: mat1 and mat2 shapes cannot be multiplied (242x26 and 27x64)\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        },
        "3": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nfrom sklearn.preprocessing import MinMaxScaler\nimport numpy as np\n\ndef read_data(train_path: str, test_path: str):\n    # Import the datasets from specified file paths\n    train_data = pd.read_excel(train_path)\n    test_data = pd.read_excel(test_path)\n    return train_data, test_data\n\ndef encode_categorical_features(df: pd.DataFrame):\n    # Encode categorical 'Dominant Wave Direction' using one-hot encoding\n    df = pd.get_dummies(df, columns=['Dominant Wave Direction'], drop_first=True)\n    return df\n\ndef preprocess_features(df: pd.DataFrame, scaler=None):\n    # Identify columns for normalization\n    features_to_normalize = ['Annual Mean Period', 'Annual Mean Tidal Range',\n                             'Annual Mean Spring Tidal Range', 'Breaker Wave Height Hb',\n                             'Deep Water Wave Height Hd', 'Intertidal Slope',\n                             'Mean Grain Size', 'Latitude', 'Longitude']\n\n    # Fill NaNs with mean values for each column\n    df.fillna(df.mean(numeric_only=True), inplace=True)\n\n    # Initialize MinMaxScaler if not provided\n    if scaler is None:\n        scaler = MinMaxScaler()\n\n    # Normalize the selected features\n    df[features_to_normalize] = scaler.fit_transform(df[features_to_normalize])\n\n    return df, scaler\n\ndef build_model(input_dim):\n    class SeaLevelPredictor(nn.Module):\n        def __init__(self, input_dim, hidden_dim=64):\n            super(SeaLevelPredictor, self).__init__()\n            self.layer1 = nn.Linear(input_dim, hidden_dim)\n            self.relu1 = nn.ReLU()\n            self.layer2 = nn.Linear(hidden_dim, hidden_dim)\n            self.relu2 = nn.ReLU()\n            self.output = nn.Linear(hidden_dim, 1)\n\n        def forward(self, x):\n            x = self.relu1(self.layer1(x))\n            x = self.relu2(self.layer2(x))\n            return self.output(x)\n    \n    model = SeaLevelPredictor(input_dim)\n    return model\n\ndef train_model(model, train_data, target='y'):\n    # Split data into features and target\n    X_train = train_data.drop(columns=[target])\n    y_train = train_data[target]\n    \n    # Convert to PyTorch tensors\n    X_train_tensor = torch.tensor(X_train.values, dtype=torch.float32)\n    y_train_tensor = torch.tensor(y_train.values, dtype=torch.float32).view(-1, 1)\n    \n    # Define loss function and optimizer\n    criterion = nn.MSELoss()\n    optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n    \n    num_epochs = 1000\n    for epoch in range(num_epochs):\n        model.train()\n        # Forward pass\n        outputs = model(X_train_tensor)\n        loss = criterion(outputs, y_train_tensor)\n        \n        # Backward pass and optimization\n        optimizer.zero_grad()\n        loss.backward()\n        optimizer.step()\n    \n    return model\n\ndef evaluate_model(model, test_data, target='y'):\n    # Split the test data into features and targets\n    X_test = test_data.drop(columns=[target])\n    y_test = test_data[target]\n    \n    # Convert to PyTorch tensors\n    X_test_tensor = torch.tensor(X_test.values, dtype=torch.float32)\n    y_test_tensor = torch.tensor(y_test.values, dtype=torch.float32).view(-1, 1)\n    \n    # Evaluate the model\n    model.eval()\n    with torch.no_grad():\n        predictions = model(X_test_tensor)\n        \n    # Calculate and return evaluation metrics\n    mse = nn.MSELoss()(predictions, y_test_tensor).item()\n    rmse = mse ** 0.5\n    return {\"RMSE\": rmse}\n\ndef main():\n    # Data paths\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n\n    # Read datasets\n    train_data, test_data = read_data(train_path, test_path)\n\n    # Encode categorical features\n    train_data = encode_categorical_features(train_data)\n    test_data = encode_categorical_features(test_data)\n\n    # Preprocess features\n    train_data, scaler = preprocess_features(train_data)\n    test_data, _ = preprocess_features(test_data, scaler)\n\n    # Build model\n    input_dim = train_data.drop(columns=['y']).shape[1]\n    model = build_model(input_dim)\n\n    # Train model with the processed training data\n    model = train_model(model, train_data)\n\n    # Evaluate the model with the processed test data\n    evaluation_metrics = evaluate_model(model, test_data)\n\n    return evaluation_metrics",
                "plan": "1. **Data Reading**: Load the training and test datasets using provided file paths. This involves reading Excel files into pandas DataFrames.\n2. **Categorical Encoding**: Use one-hot encoding for the \"Dominant Wave Direction\" column and drop the first category to avoid multicollinearity.\n3. **Feature Preprocessing**: Fill any NaN values with column means, then normalize specified numerical features using MinMaxScaler to ensure all inputs are within the same range. This scaling is fitted on the training data and applied consistently to the test data using the same scaler.\n4. **Model Building**: Define and build a neural network using PyTorch, specifying input dimensions based on the processed features. The model consists of two hidden layers and an output layer.\n5. **Model Training**: Split the preprocessed training data into features and target label, convert to PyTorch tensors, and train the neural network using Mean Squared Error loss and the Adam optimizer over a set number of epochs.\n6. **Model Evaluation**: Evaluate the trained model using the test dataset, outputting the RMSE metric to quantify model accuracy.\n7. **Main Function**: Integrate and execute all components to read data, preprocess, build, train, and evaluate the model, returning the evaluation metrics.",
                "main_function_name": "main",
                "score": 0.13654199026372854,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.622,
                "radon_score": 0.7434199026372855,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 122, in main\n  File \"<string>\", line 61, in train_model\nTypeError: can't convert np.ndarray of type numpy.object_. The only supported types are: float64, float32, float16, complex64, complex128, int64, int32, int16, int8, uint64, uint32, uint16, uint8, and bool.\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        },
        "4": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nfrom sklearn.preprocessing import MinMaxScaler, OneHotEncoder\nimport numpy as np\n\ndef read_data(train_path: str, test_path: str):\n    # Import the datasets from specified file paths\n    train_data = pd.read_excel(train_path)\n    test_data = pd.read_excel(test_path)\n    return train_data, test_data\n\ndef encode_categorical_features(df: pd.DataFrame):\n    # One-hot encode the categorical column 'Dominant Wave Direction'\n    encoder = OneHotEncoder(drop='first')\n    encoded_categories = encoder.fit_transform(df[['Dominant Wave Direction']]).toarray()\n    feature_labels = encoder.get_feature_names_out(['Dominant Wave Direction'])\n\n    df_encoded = pd.DataFrame(encoded_categories, columns=feature_labels)\n    df = pd.concat([df.drop(columns=['Dominant Wave Direction']), df_encoded], axis=1)\n    return df\n\ndef preprocess_features(df: pd.DataFrame, scaler=None):\n    # Identify features to normalize\n    features_to_normalize = ['Annual Mean Period', 'Annual Mean Tidal Range',\n                             'Annual Mean Spring Tidal Range', 'Breaker Wave Height Hb',\n                             'Deep Water Wave Height Hd', 'Intertidal Slope',\n                             'Mean Grain Size', 'Latitude', 'Longitude']\n\n    # Fill NaNs with the mean values of each column\n    df.fillna(df.mean(numeric_only=True), inplace=True)\n\n    # Initialize a MinMaxScaler if not provided\n    if scaler is None:\n        scaler = MinMaxScaler()\n\n    # Normalize the selected features\n    df[features_to_normalize] = scaler.fit_transform(df[features_to_normalize])\n\n    return df, scaler\n\ndef build_model(input_dim):\n    class SeaLevelPredictor(nn.Module):\n        def __init__(self, input_dim, hidden_dim=64):\n            super(SeaLevelPredictor, self).__init__()\n            self.layer1 = nn.Linear(input_dim, hidden_dim)\n            self.relu1 = nn.ReLU()\n            self.layer2 = nn.Linear(hidden_dim, hidden_dim)\n            self.relu2 = nn.ReLU()\n            self.output = nn.Linear(hidden_dim, 1)\n\n        def forward(self, x):\n            x = self.relu1(self.layer1(x))\n            x = self.relu2(self.layer2(x))\n            return self.output(x)\n    \n    model = SeaLevelPredictor(input_dim)\n    return model\n\ndef train_model(model, train_data, target='y'):\n    # Separate features and target variable\n    X_train = train_data.drop(columns=[target])\n    y_train = train_data[target]\n    \n    # Convert to PyTorch tensors ensuring the conversion is done for numerical formats\n    X_train_tensor = torch.tensor(X_train.values.astype(np.float32), dtype=torch.float32)\n    y_train_tensor = torch.tensor(y_train.values.astype(np.float32), dtype=torch.float32).view(-1, 1)\n    \n    # Define loss function and optimizer\n    criterion = nn.MSELoss()\n    optimizer = torch.optim.Adam(model.parameters(), lr=0.001)\n    \n    num_epochs = 1000\n    for epoch in range(num_epochs):\n        model.train()\n        # Forward pass\n        outputs = model(X_train_tensor)\n        loss = criterion(outputs, y_train_tensor)\n        \n        # Backward pass and optimization\n        optimizer.zero_grad()\n        loss.backward()\n        optimizer.step()\n    \n    return model\n\ndef evaluate_model(model, test_data, target='y'):\n    # Separate features and targets from the test dataset\n    X_test = test_data.drop(columns=[target])\n    y_test = test_data[target]\n    \n    # Convert to PyTorch tensors ensuring numerical types\n    X_test_tensor = torch.tensor(X_test.values.astype(np.float32), dtype=torch.float32)\n    y_test_tensor = torch.tensor(y_test.values.astype(np.float32), dtype=torch.float32).view(-1, 1)\n    \n    # Evaluate model performance\n    model.eval()\n    with torch.no_grad():\n        predictions = model(X_test_tensor)\n        \n    # Calculate and return evaluation metrics\n    mse = nn.MSELoss()(predictions, y_test_tensor).item()\n    rmse = mse ** 0.5\n    return {\"RMSE\": rmse}\n\ndef main():\n    # Data paths\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n\n    # Read datasets\n    train_data, test_data = read_data(train_path, test_path)\n\n    # Encode categorical features\n    train_data = encode_categorical_features(train_data)\n    test_data = encode_categorical_features(test_data)\n\n    # Preprocess features\n    train_data, scaler = preprocess_features(train_data)\n    test_data, _ = preprocess_features(test_data, scaler)\n\n    # Build model\n    input_dim = train_data.drop(columns=['y']).shape[1]\n    model = build_model(input_dim)\n\n    # Train model with the processed training data\n    model = train_model(model, train_data)\n\n    # Evaluate the model with the processed test data\n    evaluation_metrics = evaluate_model(model, test_data)\n\n    return evaluation_metrics",
                "plan": "1. **Data Reading**: The script starts by reading in training and test data from specified Excel files using the pandas library.\n2. **Categorical Encoding**: Categorical features, specifically 'Dominant Wave Direction', are encoded using one-hot encoding to prepare them for use in the neural network.\n3. **Feature Preprocessing**: Certain features are selected for normalization to ensure numeric inputs to the model remain consistent in scale. The script also fills missing values with the mean of each feature to handle NaNs.\n4. **Model Construction**: A PyTorch neural network model is created with input dimensions based on the number of processed features. \n5. **Training the Model**: The model is trained with mean squared error loss and Adam optimizer over a predefined number of epochs.\n6. **Evaluation**: After training, the model is evaluated using RMSE as a metric on the test data set.\n7. **Integrated Main Function**: The entire workflow is encapsulated within the main function, which coordinates the data processing, model training, and evaluation seamlessly.",
                "main_function_name": "main",
                "score": 0.13757792862997237,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.641,
                "radon_score": 0.7347792862997234,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 130, in main\n  File \"<string>\", line 99, in evaluate_model\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"<string>\", line 53, in forward\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\linear.py\", line 116, in forward\n    return F.linear(input, self.weight, self.bias)\nRuntimeError: mat1 and mat2 shapes cannot be multiplied (242x26 and 27x64)\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        }
    },
    {
        "0": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nimport torch\nfrom torch import nn, optim\n\n# Component: load_data\ndef load_data(train_path: str, test_path: str) -> (pd.DataFrame, pd.DataFrame):\n    # Load training data from the Excel file\n    train_data = pd.read_excel(train_path)\n    \n    # Load test data from the Excel file\n    test_data = pd.read_excel(test_path)\n    \n    return train_data, test_data\n\n# Component: preprocess_data\ndef preprocess_data(df: pd.DataFrame) -> (pd.DataFrame, StandardScaler):\n    # One-hot encode 'Dominant Wave Direction'\n    encoder = OneHotEncoder()\n    encoded_wave_direction = encoder.fit_transform(df[['Dominant Wave Direction']]).toarray()\n    wave_direction_df = pd.DataFrame(encoded_wave_direction, columns=encoder.get_feature_names_out(['Dominant Wave Direction']))\n\n    # Drop original 'Dominant Wave Direction' column and merge the new one-hot encoded columns\n    df = df.drop(columns=['Dominant Wave Direction']).join(wave_direction_df)\n    \n    # Features to standardize\n    features_to_standardize = df.drop(columns=['y']).columns\n\n    # Separate target variable 'y' and features\n    X = df.drop(columns='y')\n    y = df['y']\n\n    # Normalize continuous features using StandardScaler\n    scaler = StandardScaler()\n    X_scaled = scaler.fit_transform(X[features_to_standardize])\n    X_scaled_df = pd.DataFrame(X_scaled, columns=features_to_standardize)\n\n    # Combine scaled features with encoded categorical features\n    processed_data = pd.concat([X_scaled_df, wave_direction_df, y.reset_index(drop=True)], axis=1)\n\n    return processed_data, scaler\n\n# Component: bruun_dean_insights\ndef bruun_dean_insights(df: pd.DataFrame) -> pd.DataFrame:\n    # Example of Bruun and Dean rule adding features\n    df['Bruun_Feature'] = df['x'] * 0.1  # Example feature using x distance\n    df['Dean_Feature'] = df['x'] ** (2/3)  # Dean profile h(y) = Ay^(2/3)\n\n    return df\n\n# Component: build_deep_learning_model\ndef build_deep_learning_model(input_size: int) -> nn.Module:\n    # Define a simple Feedforward Neural Network\n    class BeachProfileModel(nn.Module):\n        def __init__(self, input_size):\n            super(BeachProfileModel, self).__init__()\n            self.fc1 = nn.Linear(input_size, 128)\n            self.fc2 = nn.Linear(128, 64)\n            self.fc3 = nn.Linear(64, 1)\n        \n        def forward(self, x):\n            x = torch.relu(self.fc1(x))\n            x = torch.relu(self.fc2(x))\n            x = self.fc3(x)\n            return x\n    \n    model = BeachProfileModel(input_size)\n    return model\n\n# Component: train_model\ndef train_model(model: nn.Module, train_data: pd.DataFrame) -> nn.Module:\n    # Separate features and target variable\n    y_train = train_data['y'].values\n    X_train = train_data.drop(columns=['y']).values\n\n    # Convert data into PyTorch tensors\n    X_train_tensor = torch.tensor(X_train, dtype=torch.float32)\n    y_train_tensor = torch.tensor(y_train, dtype=torch.float32).view(-1, 1)\n\n    # Define loss function and optimizer\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=0.001)\n\n    # Training loop\n    epochs = 100\n    for epoch in range(epochs):\n        # Forward pass\n        outputs = model(X_train_tensor)\n        loss = criterion(outputs, y_train_tensor)\n        \n        # Backward pass and optimization\n        optimizer.zero_grad()\n        loss.backward()\n        optimizer.step()\n    \n    return model\n\n# Component: evaluate_model\ndef evaluate_model(model: nn.Module, test_data: pd.DataFrame, scaler: StandardScaler) -> dict:\n    # Prepare test data\n    X_test = test_data.drop(columns='y').values\n    y_test = test_data['y'].values\n\n    # Normalize test features\n    X_test_scaled = scaler.transform(X_test)\n    X_test_scaled_tensor = torch.tensor(X_test_scaled, dtype=torch.float32)\n\n    # Predict on test data\n    model.eval()\n    with torch.no_grad():\n        predictions = model(X_test_scaled_tensor).numpy().flatten()\n    \n    # Evaluate using MAE and RMSE\n    mae = np.mean(np.abs(predictions - y_test))\n    rmse = np.sqrt(np.mean((predictions - y_test)**2))\n\n    return {'mae': mae, 'rmse': rmse}\n\n# Main function integrating all components\ndef main() -> dict:\n    # File paths\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n\n    # Step 1: Load Data\n    train_df, test_df = load_data(train_path, test_path)\n    \n    # Step 2: Preprocess Data\n    processed_train_df, scaler = preprocess_data(train_df)\n    processed_test_df, _ = preprocess_data(test_df)  # Only features, target not scaled\n\n    # Step 3: Integrate Bruun and Dean Insights\n    train_with_insights = bruun_dean_insights(processed_train_df)\n    test_with_insights = bruun_dean_insights(processed_test_df)\n\n    # Step 4: Build Deep Learning Model\n    input_size = train_with_insights.drop(columns='y').shape[1]\n    model = build_deep_learning_model(input_size)\n    \n    # Step 5: Train Model\n    trained_model = train_model(model, train_with_insights)\n\n    # Step 6: Evaluate Model\n    evaluation_results = evaluate_model(trained_model, test_with_insights, scaler)\n\n    return evaluation_results",
                "plan": "This script is structured to define a series of functions that represent each component of the task workflow, ultimately integrating them into a single runnable script.\n\nStep 1: **load_data**: This function reads training and testing datasets from specified paths using `pandas.read_excel()` and returns them as DataFrames.\n\nStep 2: **preprocess_data**: This component preprocesses the data by one-hot encoding categorical features and standardizing continuous features using `StandardScaler`. It separates the target variable 'y' and returns the processed DataFrame with a `StandardScaler` object for scaling test data.\n\nStep 3: **bruun_dean_insights**: It integrates domain knowledge from Bruun and Dean models by engineering new features that estimate the potential impact of sea level changes and equilibrium profile parameters based on the x distance.\n\nStep 4: **build_deep_learning_model**: This function sets up a PyTorch-based deep learning model. It defines a feedforward neural network model architecture, initialized using PyTorch's `torch.nn.Module`.\n\nStep 5: **train_model**: Trains the constructed deep model using the training data. This involves converting the data into PyTorch tensors, setting up a loss function and optimizer, and training over a defined number of epochs.\n\nStep 6: **evaluate_model**: This function evaluates the trained model's performance using the test dataset. It normalizes the test dataset using the previously fitted `StandardScaler`, makes predictions, and computes evaluation metrics (MAE and RMSE).\n\nFinally, the **main()** function executes all these components in sequence, starting from loading the data to evaluating the model, and returns a dictionary with evaluation metrics.",
                "main_function_name": "main",
                "score": 0.13329095153179582,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.595,
                "radon_score": 0.737909515317958,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 145, in main\n  File \"<string>\", line 106, in evaluate_model\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\sklearn\\utils\\_set_output.py\", line 157, in wrapped\n    data_to_wrap = f(self, X, *args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\sklearn\\preprocessing\\_data.py\", line 1006, in transform\n    X = self._validate_data(\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\sklearn\\base.py\", line 626, in _validate_data\n    self._check_n_features(X, reset=reset)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\sklearn\\base.py\", line 415, in _check_n_features\n    raise ValueError(\nValueError: X has 32 features, but StandardScaler is expecting 28 features as input.\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.023668639053254437
                }
            }
        },
        "1": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nimport torch\nfrom torch import nn, optim\n\n# Load data from provided file paths\ndef load_data(train_path: str, test_path: str) -> (pd.DataFrame, pd.DataFrame):\n    # Load training data from Excel file\n    train_data = pd.read_excel(train_path)\n    # Load test data from Excel file\n    test_data = pd.read_excel(test_path)\n    return train_data, test_data\n\n# Preprocess data including encoding, scaling, and feature extraction\ndef preprocess_data(df: pd.DataFrame, is_training: bool = True, encoder: OneHotEncoder = None, scaler: StandardScaler = None) -> (pd.DataFrame, OneHotEncoder, StandardScaler):\n    # One-hot encode 'Dominant Wave Direction'\n    if is_training:\n        encoder = OneHotEncoder()\n        encoded_wave_direction = encoder.fit_transform(df[['Dominant Wave Direction']]).toarray()\n    else:\n        encoded_wave_direction = encoder.transform(df[['Dominant Wave Direction']]).toarray()\n\n    wave_direction_df = pd.DataFrame(encoded_wave_direction, columns=encoder.get_feature_names_out(['Dominant Wave Direction']))\n\n    # Drop original 'Dominant Wave Direction' column and merge the new one-hot encoded columns\n    df = df.drop(columns=['Dominant Wave Direction']).join(wave_direction_df)\n    \n    # Separate target variable 'y' and features\n    X = df.drop(columns='y')\n    y = df['y']\n\n    # Normalize continuous features using StandardScaler\n    if is_training:\n        scaler = StandardScaler()\n        X_scaled = scaler.fit_transform(X)\n    else:\n        X_scaled = scaler.transform(X)\n    \n    X_scaled_df = pd.DataFrame(X_scaled, columns=X.columns)\n\n    # Combine scaled features with encoded categorical features\n    processed_data = pd.concat([X_scaled_df, y.reset_index(drop=True)], axis=1)\n\n    return processed_data, encoder, scaler\n\n# Incorporate Bruun and Dean model insights into the dataset\ndef bruun_dean_insights(df: pd.DataFrame) -> pd.DataFrame:\n    # Example feature additions based on the Bruun and Dean rules\n    df['Bruun_Feature'] = df['x'] * 0.1  # Simplified example feature using x distance\n    df['Dean_Feature'] = df['x'] ** (2/3)  # Dean model: h(y) = Ay^(2/3)\n    return df\n\n# Construct a simple deep learning model for regression with PyTorch\ndef build_deep_learning_model(input_size: int) -> nn.Module:\n    # Define a simple Feedforward Neural Network\n    class BeachProfileModel(nn.Module):\n        def __init__(self, input_size):\n            super(BeachProfileModel, self).__init__()\n            self.fc1 = nn.Linear(input_size, 128)\n            self.fc2 = nn.Linear(128, 64)\n            self.fc3 = nn.Linear(64, 1)\n        \n        def forward(self, x):\n            x = torch.relu(self.fc1(x))\n            x = torch.relu(self.fc2(x))\n            x = self.fc3(x)\n            return x\n    \n    model = BeachProfileModel(input_size)\n    return model\n\n# Train the deep learning model using the provided training dataset\ndef train_model(model: nn.Module, train_data: pd.DataFrame) -> nn.Module:\n    # Separate features and target variable\n    y_train = train_data['y'].values\n    X_train = train_data.drop(columns=['y']).values\n\n    # Convert data into PyTorch tensors\n    X_train_tensor = torch.tensor(X_train, dtype=torch.float32)\n    y_train_tensor = torch.tensor(y_train, dtype=torch.float32).view(-1, 1)\n\n    # Define loss function and optimizer\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=0.001)\n\n    # Training loop\n    epochs = 100\n    for epoch in range(epochs):\n        # Forward pass\n        outputs = model(X_train_tensor)\n        loss = criterion(outputs, y_train_tensor)\n        \n        # Backward pass and optimization\n        optimizer.zero_grad()\n        loss.backward()\n        optimizer.step()\n    \n    return model\n\n# Evaluate the deep learning model using the test dataset\ndef evaluate_model(model: nn.Module, test_data: pd.DataFrame) -> dict:\n    # Separate features and target variable\n    y_test = test_data['y'].values\n    X_test = test_data.drop(columns='y').values\n\n    # Convert data into PyTorch tensors\n    X_test_tensor = torch.tensor(X_test, dtype=torch.float32)\n\n    # Predict on test data\n    model.eval()\n    with torch.no_grad():\n        predictions = model(X_test_tensor).numpy().flatten()\n    \n    # Compute evaluation metrics: MAE and RMSE\n    mae = np.mean(np.abs(predictions - y_test))\n    rmse = np.sqrt(np.mean((predictions - y_test)**2))\n\n    return {'mae': mae, 'rmse': rmse}\n\n# Main function integrating all other component functions\ndef main() -> dict:\n    # Define file paths for train and test data\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n\n    # Load data\n    train_df, test_df = load_data(train_path, test_path)\n    \n    # Preprocess training data\n    processed_train_df, encoder, scaler = preprocess_data(train_df, is_training=True)\n\n    # Preprocess test data using the same encoder and scaler\n    processed_test_df, _, _ = preprocess_data(test_df, is_training=False, encoder=encoder, scaler=scaler)\n\n    # Integrate Bruun and Dean Insights into training and test data\n    train_with_insights = bruun_dean_insights(processed_train_df)\n    test_with_insights = bruun_dean_insights(processed_test_df)\n\n    # Build deep learning model\n    input_size = train_with_insights.drop(columns='y').shape[1]\n    model = build_deep_learning_model(input_size)\n    \n    # Train model on training data\n    trained_model = train_model(model, train_with_insights)\n\n    # Evaluate model on test data\n    evaluation_results = evaluate_model(trained_model, test_with_insights)\n\n    return evaluation_results",
                "plan": "1. **Load Data**: Read the data from specified Excel files containing training and testing datasets.\n   \n2. **Preprocess Data**:\n   - One-hot encode the categorical 'Dominant Wave Direction' feature for both datasets, ensuring that the same categories are used.\n   - Scale numerical features using `StandardScaler` to improve the stability and performance of the model during training and testing.\n   - Return the processed data-ready for model input, along with the encoder and scaler used.\n\n3. **Bruun and Dean Insights**:\n   - Integrate domain-specific insights by adding features inspired by the Bruun Rule and Dean models that can help improve model prediction by introducing domain knowledge.\n\n4. **Deep Learning Model Construction**: \n   - Define and build a simple three-layer feedforward neural network using PyTorch for predicting the 'y' values based on the input features.\n\n5. **Train Model**:\n   - Train the constructed model on the processed training data using mean squared error as the loss function, optimized using Adam optimizer.\n\n6. **Evaluate Model**:\n   - Assess the trained model's performance using test data, calculating mean absolute error (MAE) and root mean square error (RMSE) to measure accuracy and robustness.\n\n7. **Integrated Workflow (main)**: \n   - The main function coordinates the loading, preprocessing, feature extraction, model building, training, and evaluation with seamless transition and integration of all processes.",
                "main_function_name": "main",
                "score": 0.8320809868011947,
                "pass_rate": 1.0,
                "pass_rate_score": 1.0,
                "prediction_score": 0.0,
                "pylint_score": 0.593,
                "radon_score": 0.7278098680119467,
                "test_case_results": {
                    "runnability_check": {
                        "success": true,
                        "reason": null,
                        "message": "code is runnable"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.023668639053254437
                }
            }
        }
    },
    {
        "0": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nfrom sklearn.compose import ColumnTransformer\nfrom sklearn.pipeline import Pipeline\nfrom sklearn.model_selection import train_test_split\nfrom torch.utils.data import DataLoader, TensorDataset\nimport numpy as np\n\n# Component: load_data\ndef load_data(train_path: str, test_path: str):\n    # Load the training and test data from Excel files specified by the user\n    df_train = pd.read_excel(train_path)\n    df_test = pd.read_excel(test_path)\n\n    # Handle any missing values or erroneous data\n    df_train.fillna(df_train.mean(), inplace=True)\n    df_test.fillna(df_test.mean(), inplace=True)\n\n    return df_train, df_test\n\n# Component: preprocess_data\ndef preprocess_data(df: pd.DataFrame):\n    # Identify the features and target\n    features = df.drop(columns=['y'])\n    target = df['y']\n    \n    # Specify categorical and numerical features\n    categorical_features = ['Dominant Wave Direction']\n    numerical_features = features.columns.difference(categorical_features)\n\n    # Preprocess pipeline for data transformation\n    preprocessor = ColumnTransformer(transformers=[\n        ('num', StandardScaler(), numerical_features),\n        ('cat', OneHotEncoder(), categorical_features)\n    ])\n\n    # Apply transformation\n    features_transformed = preprocessor.fit_transform(features)\n\n    # Convert to DataFrame for consistency\n    features_transformed_df = pd.DataFrame(features_transformed)\n\n    return features_transformed_df, target\n\n# Component: build_neural_network_model\ndef build_neural_network_model(input_size: int):\n    # Define a simple feedforward neural network using PyTorch\n    class SeaLevelPredictor(nn.Module):\n        def __init__(self):\n            super(SeaLevelPredictor, self).__init__()\n            self.fc1 = nn.Linear(input_size, 64)\n            self.fc2 = nn.Linear(64, 32)\n            self.fc3 = nn.Linear(32, 1)  # Single output for regression\n\n        def forward(self, x):\n            x = torch.relu(self.fc1(x))\n            x = torch.relu(self.fc2(x))\n            x = self.fc3(x)\n            return x\n\n    # Instantiate the model\n    model = SeaLevelPredictor()\n    return model\n\n# Component: train_model\ndef train_model(model: nn.Module, train_loader: DataLoader, epochs: int):\n    # Set up loss function and optimizer\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=0.001)\n\n    # Train the model\n    model.train()\n    for epoch in range(epochs):\n        running_loss = 0.0\n        for i, (inputs, targets) in enumerate(train_loader):\n            optimizer.zero_grad()\n            outputs = model(inputs)\n            loss = criterion(outputs, targets)\n            loss.backward()\n            optimizer.step()\n            running_loss += loss.item()\n        print(f\"Epoch {epoch+1}/{epochs}, Loss: {running_loss/len(train_loader)}\")\n\n    return model, running_loss\n\n# Component: evaluate_model\ndef evaluate_model(model: nn.Module, test_loader: DataLoader):\n    # Set the model to evaluation mode\n    model.eval()\n    total_loss = 0.0\n    criterion = nn.MSELoss()\n    with torch.no_grad():\n        for inputs, targets in test_loader:\n            outputs = model(inputs)\n            loss = criterion(outputs, targets)\n            total_loss += loss.item()\n    \n    # Calculate RMSE\n    rmse = np.sqrt(total_loss / len(test_loader))\n    return rmse\n\n# Main function integrating all components\ndef main():\n    # Load the data\n    train_data, test_data = load_data(\n        \"beach_profile_data/processed_data/beachdata_train.xlsx\",\n        \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n    )\n\n    # Preprocess the data\n    X_train, y_train = preprocess_data(train_data)\n    X_test, y_test = preprocess_data(test_data)\n\n    # Convert to PyTorch Dataset and Dataloaders\n    train_dataset = TensorDataset(torch.tensor(X_train.values, dtype=torch.float32), torch.tensor(y_train.values, dtype=torch.float32).view(-1, 1))\n    test_dataset = TensorDataset(torch.tensor(X_test.values, dtype=torch.float32), torch.tensor(y_test.values, dtype=torch.float32).view(-1, 1))\n\n    train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)\n    test_loader = DataLoader(test_dataset, batch_size=32, shuffle=False)\n\n    # Build and train the model\n    input_size = X_train.shape[1]\n    model = build_neural_network_model(input_size)\n    trained_model, _ = train_model(model, train_loader, epochs=100)\n\n    # Evaluate the model\n    rmse = evaluate_model(trained_model, test_loader)\n\n    print(f\"Model RMSE on test set: {rmse}\")\n    return rmse",
                "plan": "The code implements a complete solution for predicting sea level changes using the given data, integrating all specified components:\n\n1. **Data Loading**: The `load_data` function reads the Excel files containing training and test datasets using pandas. Missing values are handled by filling them with column means to maintain data integrity.\n\n2. **Data Preprocessing**: In `preprocess_data`, the necessary features are transformed using a pipeline that scales numerical features and one-hot encodes categorical features. We identify that 'Dominant Wave Direction' needs encoding and numerical features need standard scaling for effective training.\n\n3. **Model Construction**: A neural network architecture suitable for regression tasks is built in `build_neural_network_model`, featuring input, hidden, and output layers with ReLU activation functions. The output layer is set to predict a continuous value.\n\n4. **Model Training**: The `train_model` function sets up the MSE loss function and Adam optimizer. It iteratively trains the model over a fixed number of epochs (100) and keeps track of the loss to monitor model convergence. The training data is input through DataLoader batches.\n\n5. **Model Evaluation**: In `evaluate_model`, the trained model is assessed on the test dataset using RMSE as the metric. The model is put into evaluation mode to avoid gradient calculations.\n\n6. **Integration**: `main()` function orchestrates the data loading, preprocessing, model building, training, and evaluation procedures, ultimately returning the RMSE as the performance metric. \n\nThis structured approach ensures a holistic and systematic process from data ingestion to model evaluation, aligning with the deep learning task's requirements.",
                "main_function_name": "main",
                "score": 0.14379707877986403,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.722,
                "radon_score": 0.7159707877986401,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 108, in main\n  File \"<string>\", line 19, in load_data\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\frame.py\", line 11338, in mean\n    result = super().mean(axis, skipna, numeric_only, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\generic.py\", line 11978, in mean\n    return self._stat_function(\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\generic.py\", line 11935, in _stat_function\n    return self._reduce(\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\frame.py\", line 11207, in _reduce\n    res = df._mgr.reduce(blk_func)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\internals\\managers.py\", line 1459, in reduce\n    nbs = blk.reduce(func)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\internals\\blocks.py\", line 377, in reduce\n    result = func(self.values)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\frame.py\", line 11139, in blk_func\n    return op(values, axis=axis, skipna=skipna, **kwds)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\nanops.py\", line 147, in f\n    result = alt(values, axis=axis, skipna=skipna, **kwds)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\nanops.py\", line 404, in new_func\n    result = func(values, axis=axis, skipna=skipna, mask=mask, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\nanops.py\", line 720, in nanmean\n    the_sum = _ensure_numeric(the_sum)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\nanops.py\", line 1678, in _ensure_numeric\n    raise TypeError(f\"Could not convert {x} to numeric\")\nTypeError: Could not convert ['ENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENENENENENENENENENENENENENENENENENENENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENEENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENENNENNENNENNENNENNENNENNENNENNENNENNENNENNENNENNENNENNENNENNENNENNEEEEEEEEEEEEEEEEEEEEE'] to numeric\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.007100591715976331
                }
            }
        },
        "1": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nfrom sklearn.compose import ColumnTransformer\nfrom sklearn.pipeline import Pipeline\nfrom sklearn.model_selection import train_test_split\nfrom torch.utils.data import DataLoader, TensorDataset\nimport numpy as np\n\n# Component: load_data\ndef load_data(train_path: str, test_path: str) -> tuple:\n    # Load the training and test data from Excel files specified by the user\n    df_train = pd.read_excel(train_path)\n    df_test = pd.read_excel(test_path)\n\n    # Handle missing values separately for numeric and categorical data\n    numeric_cols = df_train.select_dtypes(include=[np.number]).columns\n    df_train[numeric_cols] = df_train[numeric_cols].fillna(df_train[numeric_cols].mean())\n    df_test[numeric_cols] = df_test[numeric_cols].fillna(df_test[numeric_cols].mean())\n\n    # Fill categorical missing data with a placeholder\n    categorical_cols = df_train.select_dtypes(include=['object']).columns\n    df_train[categorical_cols] = df_train[categorical_cols].fillna('missing')\n    df_test[categorical_cols] = df_test[categorical_cols].fillna('missing')\n\n    return df_train, df_test\n\n# Component: preprocess_data\ndef preprocess_data(df: pd.DataFrame) -> tuple:\n    # Identify the features and target\n    features = df.drop(columns=['y'])\n    target = df['y']\n\n    # Specify categorical and numerical features\n    categorical_features = ['Dominant Wave Direction']\n    numerical_features = features.columns.difference(categorical_features)\n\n    # Preprocess pipeline for data transformation\n    preprocessor = ColumnTransformer(transformers=[\n        ('num', StandardScaler(), numerical_features),\n        ('cat', OneHotEncoder(), categorical_features)\n    ])\n\n    # Apply transformation\n    features_transformed = preprocessor.fit_transform(features)\n\n    # Convert to DataFrame for consistency\n    features_transformed_df = pd.DataFrame(features_transformed)\n\n    return features_transformed_df, target\n\n# Component: build_neural_network_model\ndef build_neural_network_model(input_size: int) -> nn.Module:\n    # Define a simple feedforward neural network using PyTorch\n    class SeaLevelPredictor(nn.Module):\n        def __init__(self):\n            super(SeaLevelPredictor, self).__init__()\n            self.fc1 = nn.Linear(input_size, 64)\n            self.fc2 = nn.Linear(64, 32)\n            self.fc3 = nn.Linear(32, 1)  # Single output for regression\n\n        def forward(self, x):\n            x = torch.relu(self.fc1(x))\n            x = torch.relu(self.fc2(x))\n            x = self.fc3(x)\n            return x\n\n    # Instantiate the model\n    model = SeaLevelPredictor()\n    return model\n\n# Component: train_model\ndef train_model(model: nn.Module, train_loader: DataLoader, epochs: int) -> tuple:\n    # Set up loss function and optimizer\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=0.001)\n\n    # Train the model\n    model.train()\n    for epoch in range(epochs):\n        running_loss = 0.0\n        for i, (inputs, targets) in enumerate(train_loader):\n            optimizer.zero_grad()\n            outputs = model(inputs)\n            loss = criterion(outputs, targets)\n            loss.backward()\n            optimizer.step()\n            running_loss += loss.item()\n        print(f\"Epoch {epoch+1}/{epochs}, Loss: {running_loss/len(train_loader)}\")\n\n    return model, running_loss\n\n# Component: evaluate_model\ndef evaluate_model(model: nn.Module, test_loader: DataLoader) -> float:\n    # Set the model to evaluation mode\n    model.eval()\n    total_loss = 0.0\n    criterion = nn.MSELoss()\n    with torch.no_grad():\n        for inputs, targets in test_loader:\n            outputs = model(inputs)\n            loss = criterion(outputs, targets)\n            total_loss += loss.item()\n    \n    # Calculate RMSE\n    rmse = np.sqrt(total_loss / len(test_loader))\n    return rmse\n\n# Main function integrating all components\ndef main():\n    # Load the data\n    train_data, test_data = load_data(\n        \"beach_profile_data/processed_data/beachdata_train.xlsx\",\n        \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n    )\n\n    # Preprocess the data\n    X_train, y_train = preprocess_data(train_data)\n    X_test, y_test = preprocess_data(test_data)\n\n    # Convert to PyTorch Dataset and Dataloaders\n    train_dataset = TensorDataset(torch.tensor(X_train.values, dtype=torch.float32), torch.tensor(y_train.values, dtype=torch.float32).view(-1, 1))\n    test_dataset = TensorDataset(torch.tensor(X_test.values, dtype=torch.float32), torch.tensor(y_test.values, dtype=torch.float32).view(-1, 1))\n\n    train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)\n    test_loader = DataLoader(test_dataset, batch_size=32, shuffle=False)\n\n    # Build and train the model\n    input_size = X_train.shape[1]\n    model = build_neural_network_model(input_size)\n    trained_model, _ = train_model(model, train_loader, epochs=100)\n\n    # Evaluate the model\n    rmse = evaluate_model(trained_model, test_loader)\n\n    print(f\"Model RMSE on test set: {rmse}\")\n    return rmse",
                "plan": "1. **Data Loading**:\n   - Load data from Excel files for the training and test sets.\n   - Handle missing values separately for numeric and categorical columns to prevent errors in data type conversion.\n\n2. **Data Preprocessing**:\n   - Separate the target column 'y' from the feature set.\n   - Identify categorical and numerical features.\n   - Transform the data using a pipeline that scales numerical data and one-hot encodes categorical data.\n\n3. **Model Building**:\n   - Implement a feedforward neural network using PyTorch.\n   - The network consists of two hidden layers with ReLU activations and an output layer for regression.\n\n4. **Training the Model**:\n   - Use mean squared error as the loss function.\n   - Use the Adam optimizer for adjusting the model weights.\n   - Iterate over epochs to train the model and output the training loss.\n\n5. **Evaluating the Model**:\n   - Set the model to evaluation mode.\n   - Calculate the RMSE on the test data to assess model performance.\n\n6. **Main Integration**:\n   - Execute the entire process by loading data, preprocessing it, training the model, and evaluating it within the main function. This function is self-contained and does not require additional input.",
                "main_function_name": "main",
                "score": 0.14578099522985283,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.747,
                "radon_score": 0.7108099522985282,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 136, in main\n  File \"<string>\", line 103, in evaluate_model\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"<string>\", line 65, in forward\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\linear.py\", line 116, in forward\n    return F.linear(input, self.weight, self.bias)\nRuntimeError: mat1 and mat2 shapes cannot be multiplied (32x27 and 28x64)\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        },
        "2": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nfrom sklearn.compose import ColumnTransformer\nfrom sklearn.pipeline import Pipeline\nfrom sklearn.model_selection import train_test_split\nfrom torch.utils.data import DataLoader, TensorDataset\nimport numpy as np\n\ndef load_data(train_path: str, test_path: str) -> tuple:\n    # Load the training and test data from Excel files\n    df_train = pd.read_excel(train_path)\n    df_test = pd.read_excel(test_path)\n\n    # Handle missing values\n    numeric_cols = df_train.select_dtypes(include=[np.number]).columns\n    df_train[numeric_cols] = df_train[numeric_cols].fillna(df_train[numeric_cols].mean())\n    df_test[numeric_cols] = df_test[numeric_cols].fillna(df_test[numeric_cols].mean())\n\n    # Fill categorical missing data with a placeholder\n    categorical_cols = df_train.select_dtypes(include=['object']).columns\n    df_train[categorical_cols] = df_train[categorical_cols].fillna('missing')\n    df_test[categorical_cols] = df_test[categorical_cols].fillna('missing')\n\n    return df_train, df_test\n\ndef preprocess_data(df: pd.DataFrame) -> tuple:\n    # Identify features and target\n    features = df.drop(columns=['y'])\n    target = df['y']\n\n    # Specify categorical and numerical features\n    categorical_features = ['Dominant Wave Direction']\n    numerical_features = features.columns.difference(categorical_features)\n\n    # Preprocessing pipeline\n    preprocessor = ColumnTransformer(transformers=[\n        ('num', StandardScaler(), numerical_features),\n        ('cat', OneHotEncoder(sparse=False), categorical_features)\n    ])\n\n    # Apply transformation\n    features_transformed = preprocessor.fit_transform(features)\n\n    # Convert to DataFrame\n    features_transformed_df = pd.DataFrame(features_transformed)\n\n    # Return processed features and target\n    return features_transformed_df, target\n\ndef build_neural_network_model(input_size: int) -> nn.Module:\n    # Define a feedforward neural network using PyTorch\n    class SeaLevelPredictor(nn.Module):\n        def __init__(self):\n            super(SeaLevelPredictor, self).__init__()\n            self.fc1 = nn.Linear(input_size, 64)\n            self.fc2 = nn.Linear(64, 32)\n            self.fc3 = nn.Linear(32, 1)  # Single output for regression\n\n        def forward(self, x):\n            x = torch.relu(self.fc1(x))\n            x = torch.relu(self.fc2(x))\n            x = self.fc3(x)\n            return x\n\n    # Instantiate the model\n    model = SeaLevelPredictor()\n    return model\n\ndef train_model(model: nn.Module, train_loader: DataLoader, epochs: int) -> tuple:\n    # Set up loss function and optimizer\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=0.001)\n\n    # Train the model\n    model.train()\n    for epoch in range(epochs):\n        running_loss = 0.0\n        for inputs, targets in train_loader:\n            optimizer.zero_grad()\n            outputs = model(inputs)\n            loss = criterion(outputs, targets)\n            loss.backward()\n            optimizer.step()\n            running_loss += loss.item()\n        print(f\"Epoch {epoch+1}/{epochs}, Loss: {running_loss/len(train_loader)}\")\n\n    return model, running_loss\n\ndef evaluate_model(model: nn.Module, test_loader: DataLoader) -> float:\n    # Set model to evaluation mode\n    model.eval()\n    total_loss = 0.0\n    criterion = nn.MSELoss()\n    with torch.no_grad():\n        for inputs, targets in test_loader:\n            outputs = model(inputs)\n            loss = criterion(outputs, targets)\n            total_loss += loss.item()\n    \n    # Calculate RMSE\n    rmse = np.sqrt(total_loss / len(test_loader))\n    return rmse\n\ndef main():\n    # Load the data\n    train_data, test_data = load_data(\n        \"beach_profile_data/processed_data/beachdata_train.xlsx\",\n        \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n    )\n\n    # Preprocess the data\n    X_train, y_train = preprocess_data(train_data)\n    X_test, y_test = preprocess_data(test_data)\n\n    # Convert to PyTorch Dataset and DataLoaders\n    train_dataset = TensorDataset(torch.tensor(X_train.values, dtype=torch.float32), torch.tensor(y_train.values, dtype=torch.float32).view(-1, 1))\n    test_dataset = TensorDataset(torch.tensor(X_test.values, dtype=torch.float32), torch.tensor(y_test.values, dtype=torch.float32).view(-1, 1))\n\n    train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)\n    test_loader = DataLoader(test_dataset, batch_size=32, shuffle=False)\n\n    # Build and train the model\n    input_size = X_train.shape[1]  # Ensuring correct input size for the model\n    model = build_neural_network_model(input_size)\n    trained_model, _ = train_model(model, train_loader, epochs=100)\n\n    # Evaluate the model\n    rmse = evaluate_model(trained_model, test_loader)\n\n    print(f\"Model RMSE on test set: {rmse}\")\n    return rmse",
                "plan": "1. **Load Data**: The code uses `load_data()` to load Excel files into dataframes, handling missing numeric and categorical data separately by filling with mean values and a placeholder, respectively.\n\n2. **Preprocess Data**: In `preprocess_data()`, data is split into features and target. Categorical data is one-hot encoded, and numerical data is standardized using a pipeline. \n\n3. **Build Model**: `build_neural_network_model()` defines a neural network using PyTorch with input size matching the processed feature set's dimensions.\n\n4. **Train Model**: `train_model()` leverages DataLoader and trains the model on batches of input data, calculating loss with MSE and updating model parameters through backpropagation.\n\n5. **Evaluate Model**: `evaluate_model()` sets the model to evaluation mode and computes RMSE over the test dataset's predictions.\n\n6. **Main Workflow**:  Loads data, preprocesses it, constructs datasets for PyTorch, builds the model, trains it, and evaluates performance. RMSE is printed at the end.",
                "main_function_name": "main",
                "score": 0.14573319847010222,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.759,
                "radon_score": 0.6983319847010221,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 131, in main\n  File \"<string>\", line 99, in evaluate_model\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"<string>\", line 63, in forward\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\linear.py\", line 116, in forward\n    return F.linear(input, self.weight, self.bias)\nRuntimeError: mat1 and mat2 shapes cannot be multiplied (32x27 and 28x64)\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        },
        "3": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nfrom sklearn.compose import ColumnTransformer\nfrom torch.utils.data import DataLoader, TensorDataset\nimport numpy as np\n\ndef load_data(train_path: str, test_path: str) -> tuple:\n    df_train = pd.read_excel(train_path)\n    df_test = pd.read_excel(test_path)\n\n    numeric_cols = df_train.select_dtypes(include=[np.number]).columns\n    df_train[numeric_cols] = df_train[numeric_cols].fillna(df_train[numeric_cols].mean())\n    df_test[numeric_cols] = df_test[numeric_cols].fillna(df_test[numeric_cols].mean())\n\n    categorical_cols = df_train.select_dtypes(include=['object']).columns\n    df_train[categorical_cols] = df_train[categorical_cols].fillna('missing')\n    df_test[categorical_cols] = df_test[categorical_cols].fillna('missing')\n\n    return df_train, df_test\n\ndef preprocess_data(df: pd.DataFrame) -> tuple:\n    # Separate features and target variable\n    features = df.drop(columns=['y'])\n    target = df['y']\n\n    # Define categorical and numerical features\n    categorical_features = ['Dominant Wave Direction']\n    numerical_features = features.columns.difference(categorical_features)\n\n    # Create the preprocessing pipeline\n    preprocessor = ColumnTransformer(transformers=[\n        ('num', StandardScaler(), numerical_features),\n        ('cat', OneHotEncoder(sparse=False, handle_unknown='ignore'), categorical_features)\n    ])\n\n    # Transform features\n    features_transformed = preprocessor.fit_transform(features)\n\n    return features_transformed, target, preprocessor\n\ndef build_neural_network_model(input_size: int) -> nn.Module:\n    class SeaLevelPredictor(nn.Module):\n        def __init__(self, input_size):\n            super(SeaLevelPredictor, self).__init__()\n            self.fc1 = nn.Linear(input_size, 64)\n            self.fc2 = nn.Linear(64, 32)\n            self.fc3 = nn.Linear(32, 1)\n\n        def forward(self, x):\n            x = torch.relu(self.fc1(x))\n            x = torch.relu(self.fc2(x))\n            x = self.fc3(x)\n            return x\n\n    model = SeaLevelPredictor(input_size)\n    return model\n\ndef train_model(model: nn.Module, train_loader: DataLoader, epochs: int) -> tuple:\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=0.001)\n\n    model.train()\n    for epoch in range(epochs):\n        running_loss = 0.0\n        for inputs, targets in train_loader:\n            optimizer.zero_grad()\n            outputs = model(inputs)\n            loss = criterion(outputs, targets)\n            loss.backward()\n            optimizer.step()\n            running_loss += loss.item()\n        print(f\"Epoch {epoch+1}/{epochs}, Loss: {running_loss/len(train_loader)}\")\n\n    return model\n\ndef evaluate_model(model: nn.Module, test_loader: DataLoader) -> float:\n    model.eval()\n    total_loss = 0.0\n    criterion = nn.MSELoss()\n    with torch.no_grad():\n        for inputs, targets in test_loader:\n            outputs = model(inputs)\n            loss = criterion(outputs, targets)\n            total_loss += loss.item()\n    \n    rmse = np.sqrt(total_loss / len(test_loader))\n    return rmse\n\ndef main():\n    train_data, test_data = load_data(\n        \"beach_profile_data/processed_data/beachdata_train.xlsx\",\n        \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n    )\n\n    X_train, y_train, preprocessor = preprocess_data(train_data)\n    X_test, y_test, _ = preprocess_data(test_data)\n\n    X_train = torch.tensor(X_train, dtype=torch.float32)\n    y_train = torch.tensor(y_train.values, dtype=torch.float32).view(-1, 1)\n    X_test = torch.tensor(X_test, dtype=torch.float32)\n    y_test = torch.tensor(y_test.values, dtype=torch.float32).view(-1, 1)\n\n    train_dataset = TensorDataset(X_train, y_train)\n    test_dataset = TensorDataset(X_test, y_test)\n\n    train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)\n    test_loader = DataLoader(test_dataset, batch_size=32, shuffle=False)\n\n    model = build_neural_network_model(X_train.shape[1])\n    trained_model = train_model(model, train_loader, epochs=100)\n\n    rmse = evaluate_model(trained_model, test_loader)\n\n    print(f\"Model RMSE on test set: {rmse}\")\n    return rmse",
                "plan": "1. **Data Loading**:\n   - Load train and test data using Pandas from Excel files.\n   - Fill missing numerical data with their respective column means.\n   - Fill missing categorical data with a placeholder ('missing').\n\n2. **Data Preprocessing**:\n   - Separate features from the target.\n   - Identify numerical and categorical columns. Use `StandardScaler` for scaling numerical features and `OneHotEncoder` for encoding categorical features.\n   - Apply transformations and obtain preprocessed feature arrays.\n\n3. **Model Definition**:\n   - Define a neural network using PyTorch with appropriate layers and activation functions.\n   - Ensure the input size of the first layer matches the number of features.\n\n4. **Training**:\n   - Use mean squared error as the loss function and Adam optimizer for training.\n   - Train through multiple epochs with data loaded in batches via DataLoader.\n\n5. **Evaluation**:\n   - Evaluate the model on the test dataset using RMSE as the performance metric.\n\n6. **Main Execution**:\n   - Execute all steps from data loading to model evaluation under the `main` function, ensuring separation of logic and no user input required.",
                "main_function_name": "main",
                "score": 0.13429824401446708,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.771,
                "radon_score": 0.5719824401446707,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 115, in main\n  File \"<string>\", line 85, in evaluate_model\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"<string>\", line 53, in forward\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\linear.py\", line 116, in forward\n    return F.linear(input, self.weight, self.bias)\nRuntimeError: mat1 and mat2 shapes cannot be multiplied (32x27 and 28x64)\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        },
        "4": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nfrom sklearn.compose import ColumnTransformer\nfrom torch.utils.data import DataLoader, TensorDataset\nimport numpy as np\n\ndef load_data(train_path: str, test_path: str) -> tuple:\n    df_train = pd.read_excel(train_path)\n    df_test = pd.read_excel(test_path)\n\n    numeric_cols = df_train.select_dtypes(include=[np.number]).columns\n    df_train[numeric_cols] = df_train[numeric_cols].fillna(df_train[numeric_cols].mean())\n    df_test[numeric_cols] = df_test[numeric_cols].fillna(df_test[numeric_cols].mean())\n\n    categorical_cols = df_train.select_dtypes(include=['object']).columns\n    df_train[categorical_cols] = df_train[categorical_cols].fillna('missing')\n    df_test[categorical_cols] = df_test[categorical_cols].fillna('missing')\n\n    return df_train, df_test\n\ndef preprocess_data(df: pd.DataFrame, preprocessor=None) -> tuple:\n    # Separate features and target variable\n    features = df.drop(columns=['y'])\n    target = df['y']\n\n    # Define categorical and numerical features\n    categorical_features = ['Dominant Wave Direction']\n    numerical_features = features.columns.difference(categorical_features)\n\n    # Create or use the provided preprocessing pipeline\n    if preprocessor is None:\n        preprocessor = ColumnTransformer(transformers=[\n            ('num', StandardScaler(), numerical_features),\n            ('cat', OneHotEncoder(sparse=False, handle_unknown='ignore'), categorical_features)\n        ])\n\n    # Transform features\n    features_transformed = preprocessor.fit_transform(features)\n\n    return features_transformed, target, preprocessor\n\ndef build_neural_network_model(input_size: int) -> nn.Module:\n    # Define the neural network architecture\n    class SeaLevelPredictor(nn.Module):\n        def __init__(self, input_size):\n            super(SeaLevelPredictor, self).__init__()\n            self.fc1 = nn.Linear(input_size, 64)\n            self.fc2 = nn.Linear(64, 32)\n            self.fc3 = nn.Linear(32, 1)\n\n        def forward(self, x):\n            x = torch.relu(self.fc1(x))\n            x = torch.relu(self.fc2(x))\n            x = self.fc3(x)\n            return x\n\n    model = SeaLevelPredictor(input_size)\n    return model\n\ndef train_model(model: nn.Module, train_loader: DataLoader, epochs: int) -> tuple:\n    # Set loss function and optimizer\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=0.001)\n\n    # Training the model\n    model.train()\n    for epoch in range(epochs):\n        running_loss = 0.0\n        for inputs, targets in train_loader:\n            optimizer.zero_grad()\n            outputs = model(inputs)\n            loss = criterion(outputs, targets)\n            loss.backward()\n            optimizer.step()\n            running_loss += loss.item()\n        print(f\"Epoch {epoch+1}/{epochs}, Loss: {running_loss/len(train_loader)}\")\n\n    return model\n\ndef evaluate_model(model: nn.Module, test_loader: DataLoader) -> float:\n    model.eval()\n    total_loss = 0.0\n    criterion = nn.MSELoss()\n    with torch.no_grad():\n        for inputs, targets in test_loader:\n            outputs = model(inputs)\n            loss = criterion(outputs, targets)\n            total_loss += loss.item()\n\n    # Calculate RMSE\n    rmse = np.sqrt(total_loss / len(test_loader))\n    return rmse\n\ndef main():\n    # Load and preprocess the data\n    train_data, test_data = load_data(\n        \"beach_profile_data/processed_data/beachdata_train.xlsx\",\n        \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n    )\n\n    # Preprocess training and testing data\n    X_train, y_train, preprocessor = preprocess_data(train_data)\n    X_test, y_test, _ = preprocess_data(test_data, preprocessor)\n\n    # Convert to PyTorch tensors\n    X_train = torch.tensor(X_train, dtype=torch.float32)\n    y_train = torch.tensor(y_train.values, dtype=torch.float32).view(-1, 1)\n    X_test = torch.tensor(X_test, dtype=torch.float32)\n    y_test = torch.tensor(y_test.values, dtype=torch.float32).view(-1, 1)\n\n    # Create data loaders\n    train_dataset = TensorDataset(X_train, y_train)\n    test_dataset = TensorDataset(X_test, y_test)\n\n    train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)\n    test_loader = DataLoader(test_dataset, batch_size=32, shuffle=False)\n\n    # Build the model using correct input size\n    model = build_neural_network_model(X_train.shape[1])\n    trained_model = train_model(model, train_loader, epochs=100)\n\n    # Evaluate the model\n    rmse = evaluate_model(trained_model, test_loader)\n    print(f\"Model RMSE on test set: {rmse}\")\n    return rmse",
                "plan": "1. **Data Loading**: Read the training and testing datasets using `pandas`. Fill any missing numerical values with the column mean, and missing categorical values with 'missing'.\n\n2. **Data Preprocessing**: \n   - Separate the dataset into features and target variable `y`.\n   - Identify categorical and numerical features.\n   - Standardize numerical features and encode categorical features using `ColumnTransformer`.\n   - Transform the feature set into a suitable format using the preprocessing pipeline.\n\n3. **Neural Network Model**:\n   - Define a neural network with three fully connected layers. The size of the input layer is determined by the number of processed features.\n   - Ensure the layer dimensions are correct to prevent dimensionality mismatches.\n\n4. **Model Training**:\n   - Use the mean squared error loss function and the Adam optimizer.\n   - Train the model for a specified number of epochs, printing the loss at each epoch.\n\n5. **Model Evaluation**:\n   - Evaluate the trained model using a separate test dataset.\n   - Calculate and print the RMSE to assess model performance.\n\n6. **Integration**:\n   - The `main()` function integrates all the components, handling data loading, preprocessing, model training, and evaluation without requiring any user input.",
                "main_function_name": "main",
                "score": 0.14493102686552972,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.798,
                "radon_score": 0.6513102686552972,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 126, in main\n  File \"<string>\", line 89, in evaluate_model\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"<string>\", line 55, in forward\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\linear.py\", line 116, in forward\n    return F.linear(input, self.weight, self.bias)\nRuntimeError: mat1 and mat2 shapes cannot be multiplied (32x27 and 28x64)\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        }
    },
    {
        "0": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nfrom sklearn.metrics import mean_squared_error\n\n# Load the Excel datasets and prepare them for subsequent prediction tasks.\ndef load_data(train_path: str, test_path: str):\n    # Read the train and test data from the specified paths using pandas\n    train_df = pd.read_excel(train_path)\n    test_df = pd.read_excel(test_path)\n    # Return the DataFrame containing training data and testing data\n    return train_df, test_df\n\n# Preprocess the data by handling missing values, encoding categorical features, and standardizing numerical features.\ndef preprocess_data(data: pd.DataFrame):\n    # Handle missing values by dropping rows with missing target values 'y'\n    data = data.dropna(subset=['y'])\n\n    # One-hot encode the 'Dominant Wave Direction' column\n    wave_encoder = OneHotEncoder(sparse=False, handle_unknown='ignore')\n    encoded_wave_dir = wave_encoder.fit_transform(data[['Dominant Wave Direction']])\n    wave_dir_df = pd.DataFrame(encoded_wave_dir, columns=wave_encoder.get_feature_names_out(['Dominant Wave Direction']))\n\n    # Drop the original categorical column and concatenate the new one-hot encoded columns\n    data = data.drop(columns=['Dominant Wave Direction']).reset_index(drop=True)\n    data = pd.concat([data, wave_dir_df], axis=1)\n\n    # Standardize numerical features\n    scaler = StandardScaler()\n    numerical_features = data.drop(columns=['y', 'x'])  # Exclude target and primary input\n    data[numerical_features.columns] = scaler.fit_transform(numerical_features)\n\n    # Return the preprocessed DataFrame\n    return data\n\n# Implement the Bruun Rule to calculate shoreline position changes based on input features.\ndef bruun_model(S: float, L: float, d: float, B: float):\n    if (d + B) == 0:\n        return 0\n    \n    # Calculate change in shoreline position using the Bruun Rule formula\n    delta_y = (S * L) / (d + B)\n    return delta_y\n\n# Develop and train a deep learning model to predict elevation based on a set of selected features.\ndef deep_learning_model(train_df: pd.DataFrame, test_df: pd.DataFrame):\n    # Define the model structure using PyTorch\n    class SimpleRegressor(nn.Module):\n        def __init__(self, input_dim):\n            super(SimpleRegressor, self).__init__()\n            self.linear1 = nn.Linear(input_dim, 64)\n            self.relu = nn.ReLU()\n            self.linear2 = nn.Linear(64, 1)\n\n        def forward(self, x):\n            x = self.linear1(x)\n            x = self.relu(x)\n            x = self.linear2(x)\n            return x\n    \n    # Prepare input and output data\n    X_train = train_df.drop(columns=['y']).values.astype(np.float32)\n    y_train = train_df['y'].values.astype(np.float32).reshape(-1, 1)\n    X_test = test_df.drop(columns=['y']).values.astype(np.float32)\n    y_test = test_df['y'].values.astype(np.float32).reshape(-1, 1)\n\n    # Initialize model, loss function and optimizer\n    model = SimpleRegressor(X_train.shape[1])\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=0.001)\n\n    # Model training\n    for epoch in range(1000):\n        model.train()\n        optimizer.zero_grad()\n        predictions = model(torch.from_numpy(X_train))\n        loss = criterion(predictions, torch.from_numpy(y_train))\n        loss.backward()\n        optimizer.step()\n\n    return model\n\n# Evaluate the trained deep learning model on the test dataset to assess prediction performance.\ndef evaluate_model(model: torch.nn.Module, test_df: pd.DataFrame):\n    # Prepare the input and true output data\n    X_test = test_df.drop(columns=['y']).values.astype(np.float32)\n    y_test = test_df['y'].values.astype(np.float32).reshape(-1, 1)\n\n    # Predict the target variable using the test data\n    model.eval()\n    with torch.no_grad():\n        predictions = model(torch.from_numpy(X_test)).numpy()\n\n    # Evaluate the model using RMSE\n    rmse = np.sqrt(mean_squared_error(y_test, predictions))\n\n    return rmse\n\ndef main():\n    # Load the dataset\n    train_df, test_df = load_data(\"beach_profile_data/processed_data/beachdata_train.xlsx\",\n                                  \"beach_profile_data/processed_data/beachdata_test.xlsx\")\n    \n    # Preprocess the dataset\n    train_df = preprocess_data(train_df)\n    test_df = preprocess_data(test_df)\n    \n    # Example usage of Bruun model (example values given)\n    bruunn_result = bruun_model(S=1.0, L=100.0, d=5.0, B=2.0)\n    \n    # Train the deep learning model\n    trained_model = deep_learning_model(train_df, test_df)\n    \n    # Evaluate the model\n    rmse = evaluate_model(trained_model, test_df)\n\n    return rmse",
                "plan": "1. **load_data**: This function loads the Excel data from the specified paths for training and test datasets using pandas. It returns two DataFrames, one for each dataset.\n\n2. **preprocess_data**: This function prepares the loaded data. It handles missing values by dropping any rows with missing 'y' values, encodes the categorical 'Dominant Wave Direction' using a OneHotEncoder, and standardizes the numerical features to improve the performance of the deep learning model.\n\n3. **bruun_model**: This function implements the Bruun Rule, providing a calculation of shoreline position change using the specified formula, given the rise in sea level, profile length, water depth, and berm height. This function returns the calculated change.\n\n4. **deep_learning_model**: Uses PyTorch to define and train a simple feedforward neural network to predict 'y' from the preprocessed feature set. The training loop runs for a fixed number of epochs with mean squared error as the loss function, optimized using Adam.\n\n5. **evaluate_model**: This evaluates the deep learning model on test data by predicting outcomes and calculating RMSE to assess prediction accuracy.\n\n6. **main**: This ties all functions into one workflow. The main function first loads and preprocesses data, applies the Bruun model for a sample calculation, trains the neural network, and evaluates its performance on test data, returning RMSE as the primary evaluation metric.",
                "main_function_name": "main",
                "score": 0.12942923879436877,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.557,
                "radon_score": 0.7372923879436877,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 118, in main\n  File \"<string>\", line 95, in evaluate_model\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"<string>\", line 59, in forward\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\linear.py\", line 116, in forward\n    return F.linear(input, self.weight, self.bias)\nRuntimeError: mat1 and mat2 shapes cannot be multiplied (242x27 and 28x64)\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        },
        "1": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nfrom sklearn.metrics import mean_squared_error\n\n# Load the Excel datasets and prepare them for subsequent prediction tasks.\ndef load_data(train_path: str, test_path: str):\n    # Read the train and test data from the specified paths using pandas\n    train_df = pd.read_excel(train_path)\n    test_df = pd.read_excel(test_path)\n    # Return the DataFrames containing training data and testing data\n    return train_df, test_df\n\n# Preprocess the data by handling missing values, encoding categorical features, and standardizing numerical features.\ndef preprocess_data(data: pd.DataFrame):\n    # Handle missing values by dropping rows with missing target values 'y'\n    data = data.dropna(subset=['y'])\n\n    # One-hot encode the 'Dominant Wave Direction' column\n    wave_encoder = OneHotEncoder(sparse=False, handle_unknown='ignore')\n    encoded_wave_dir = wave_encoder.fit_transform(data[['Dominant Wave Direction']])\n    wave_dir_df = pd.DataFrame(encoded_wave_dir, columns=wave_encoder.get_feature_names_out(['Dominant Wave Direction']))\n\n    # Drop the original categorical column and concatenate the new one-hot encoded columns\n    data = data.drop(columns=['Dominant Wave Direction']).reset_index(drop=True)\n    data = pd.concat([data, wave_dir_df], axis=1)\n\n    # Standardize numerical features\n    scaler = StandardScaler()\n    numerical_features = data.drop(columns=['y', 'x'])  # Exclude target and primary input\n    data[numerical_features.columns] = scaler.fit_transform(numerical_features)\n\n    # Return the preprocessed DataFrame\n    return data\n\n# Implement the Bruun Rule to calculate shoreline position changes based on input features.\ndef bruun_model(S: float, L: float, d: float, B: float):\n    if (d + B) == 0:\n        return 0\n    \n    # Calculate change in shoreline position using the Bruun Rule formula\n    delta_y = (S * L) / (d + B)\n    return delta_y\n\n# Develop and train a deep learning model to predict elevation based on a set of selected features.\ndef deep_learning_model(train_df: pd.DataFrame, test_df: pd.DataFrame):\n    # Define the model structure using PyTorch\n    class SimpleRegressor(nn.Module):\n        def __init__(self, input_dim):\n            super(SimpleRegressor, self).__init__()\n            self.linear1 = nn.Linear(input_dim, 64)\n            self.relu = nn.ReLU()\n            self.linear2 = nn.Linear(64, 1)\n\n        def forward(self, x):\n            x = self.linear1(x)\n            x = self.relu(x)\n            x = self.linear2(x)\n            return x\n\n    # Prepare input and output data\n    X_train = train_df.drop(columns=['y']).values.astype(np.float32)\n    y_train = train_df['y'].values.astype(np.float32).reshape(-1, 1)\n\n    # Align model input dimension with preprocessed feature count\n    input_dim = X_train.shape[1]\n    \n    # Initialize model, loss function and optimizer\n    model = SimpleRegressor(input_dim)\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=0.001)\n\n    # Model training\n    for epoch in range(1000):\n        model.train()\n        optimizer.zero_grad()\n        predictions = model(torch.from_numpy(X_train))\n        loss = criterion(predictions, torch.from_numpy(y_train))\n        loss.backward()\n        optimizer.step()\n\n    return model\n\n# Evaluate the trained deep learning model on the test dataset to assess prediction performance.\ndef evaluate_model(model: torch.nn.Module, test_df: pd.DataFrame):\n    # Prepare the input and true output data\n    X_test = test_df.drop(columns=['y']).values.astype(np.float32)\n    y_test = test_df['y'].values.astype(np.float32).reshape(-1, 1)\n\n    # Predict the target variable using the test data\n    model.eval()\n    with torch.no_grad():\n        predictions = model(torch.from_numpy(X_test)).numpy()\n\n    # Evaluate the model using RMSE\n    rmse = np.sqrt(mean_squared_error(y_test, predictions))\n\n    return rmse\n\ndef main():\n    # Load the dataset\n    train_df, test_df = load_data(\"beach_profile_data/processed_data/beachdata_train.xlsx\",\n                                  \"beach_profile_data/processed_data/beachdata_test.xlsx\")\n    \n    # Preprocess the dataset\n    train_df = preprocess_data(train_df)\n    test_df = preprocess_data(test_df)\n    \n    # Example usage of Bruun model (example values given)\n    bruunn_result = bruun_model(S=1.0, L=100.0, d=5.0, B=2.0)\n    \n    # Train the deep learning model\n    trained_model = deep_learning_model(train_df, test_df)\n    \n    # Evaluate the model\n    rmse = evaluate_model(trained_model, test_df)\n\n    return rmse",
                "plan": "The workflow of the code is as follows:\n\n1. **Data Loading**:\n   - `load_data()` function reads the Excel files using pandas and returns DataFrame instances for training and testing datasets.\n\n2. **Data Preprocessing**:\n   - `preprocess_data()` function handles missing values by dropping any rows with missing target 'y'.\n   - Categorical data, specifically 'Dominant Wave Direction', is one-hot encoded to make it suitable for numerical computations.\n   - Numerical features are standardized using `StandardScaler` to ensure that data input scales are more uniform, improving model performance.\n\n3. **Bruun Rule Implementation**:\n   - `bruun_model()` function provides a simple physical model calculation emulating shoreline position changes due to sea level rise. This isn't directly used in deep learning training but serves as a conceptual tool for understanding sea level effects.\n\n4. **Deep Learning Model**:\n   - A simple neural network is defined using PyTorch, consisting of an input layer, hidden layer with ReLU activation, and an output layer.\n   - The model is trained over 1000 epochs, predicting the elevation from input features excluding 'y' and using `MSELoss` as the criterion.\n\n5. **Model Evaluation**:\n   - Evaluates the model on the test set using the RMSE metric by comparing predicted versus actual 'y' values.\n\n6. **Main Execution**:\n   - `main()` function orchestrates loading, preprocessing, model training, and evaluation, returning the RMSE value for the model's predictions on the test data.\n\nThese components are designed to seamlessly integrate within the main function, which can be triggered without additional input parameters.",
                "main_function_name": "main",
                "score": 0.1324552436226345,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.58,
                "radon_score": 0.7445524362263451,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 119, in main\n  File \"<string>\", line 96, in evaluate_model\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"<string>\", line 59, in forward\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\linear.py\", line 116, in forward\n    return F.linear(input, self.weight, self.bias)\nRuntimeError: mat1 and mat2 shapes cannot be multiplied (242x27 and 28x64)\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        },
        "2": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\nfrom sklearn.preprocessing import StandardScaler, OneHotEncoder\nfrom sklearn.metrics import mean_squared_error\n\ndef load_data(train_path: str, test_path: str):\n    train_df = pd.read_excel(train_path)\n    test_df = pd.read_excel(test_path)\n    return train_df, test_df\n\ndef preprocess_data(data: pd.DataFrame, wave_encoder=None, scaler=None):\n    data = data.dropna(subset=['y'])\n\n    if wave_encoder is None:\n        wave_encoder = OneHotEncoder(sparse=False, handle_unknown='ignore')\n        wave_encoded = wave_encoder.fit_transform(data[['Dominant Wave Direction']])\n    else:\n        wave_encoded = wave_encoder.transform(data[['Dominant Wave Direction']])\n\n    wave_dir_df = pd.DataFrame(wave_encoded, columns=wave_encoder.get_feature_names_out(['Dominant Wave Direction']))\n    data = data.drop(columns=['Dominant Wave Direction']).reset_index(drop=True)\n    data = pd.concat([data, wave_dir_df], axis=1)\n\n    if scaler is None:\n        scaler = StandardScaler()\n        numerical_features = data.drop(columns=['y']).columns\n        data[numerical_features] = scaler.fit_transform(data[numerical_features])\n    else:\n        numerical_features = data.drop(columns=['y']).columns\n        data[numerical_features] = scaler.transform(data[numerical_features])\n\n    return data, wave_encoder, scaler\n\ndef bruun_model(S: float, L: float, d: float, B: float):\n    if (d + B) == 0:\n        return 0\n    delta_y = (S * L) / (d + B)\n    return delta_y\n\ndef deep_learning_model(train_df: pd.DataFrame):\n    class SimpleRegressor(nn.Module):\n        def __init__(self, input_dim):\n            super(SimpleRegressor, self).__init__()\n            self.linear1 = nn.Linear(input_dim, 64)\n            self.relu = nn.ReLU()\n            self.linear2 = nn.Linear(64, 1)\n\n        def forward(self, x):\n            x = self.linear1(x)\n            x = self.relu(x)\n            x = self.linear2(x)\n            return x\n\n    X_train = train_df.drop(columns=['y']).values.astype(np.float32)\n    y_train = train_df['y'].values.astype(np.float32).reshape(-1, 1)\n\n    input_dim = X_train.shape[1]\n    model = SimpleRegressor(input_dim)\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=0.001)\n\n    for epoch in range(1000):\n        model.train()\n        optimizer.zero_grad()\n        predictions = model(torch.from_numpy(X_train))\n        loss = criterion(predictions, torch.from_numpy(y_train))\n        loss.backward()\n        optimizer.step()\n\n    return model\n\ndef evaluate_model(model: torch.nn.Module, test_df: pd.DataFrame):\n    X_test = test_df.drop(columns=['y']).values.astype(np.float32)\n    y_test = test_df['y'].values.astype(np.float32).reshape(-1, 1)\n\n    model.eval()\n    with torch.no_grad():\n        predictions = model(torch.from_numpy(X_test)).numpy()\n\n    rmse = np.sqrt(mean_squared_error(y_test, predictions))\n    return rmse\n\ndef main():\n    train_df, test_df = load_data(\"beach_profile_data/processed_data/beachdata_train.xlsx\",\n                                  \"beach_profile_data/processed_data/beachdata_test.xlsx\")\n    \n    train_df, wave_encoder, scaler = preprocess_data(train_df)\n    test_df, _, _ = preprocess_data(test_df, wave_encoder, scaler)\n    \n    bruunn_result = bruun_model(S=1.0, L=100.0, d=5.0, B=2.0)\n    \n    trained_model = deep_learning_model(train_df)\n    rmse = evaluate_model(trained_model, test_df)\n\n    return rmse",
                "plan": "The script workflow proceeds as follows:\n\n1. **Loading Data**: The `load_data` function reads the training and testing datasets from Excel files, returning them as pandas DataFrames.\n\n2. **Preprocessing**: The `preprocess_data` function handles missing values, encodes the categorical 'Dominant Wave Direction', and standardizes the numerical features. One-hot encoding and feature scaling are managed by `OneHotEncoder` and `StandardScaler`. These transformations are reused for both train and test sets to ensure consistency in preprocessing.\n\n3. **Bruun Model**: A simple function, `bruun_model`, applies the Bruun Rule for shoreline movement estimation, although it's illustrative here rather than linked with actual predictions.\n\n4. **Deep Learning Model**: The `deep_learning_model` function initializes and trains a simple feed-forward neural network using PyTorch to predict the target variable `y` from preprocessed features. It ensures the input dimension matches the number of features post-preprocessing.\n\n5. **Model Evaluation**: The `evaluate_model` function predicts target values for the test set and computes the RMSE metric to assess model performance.\n\n6. **Main Function**: The `main` function orchestrates loading data, applying preprocessing, running baseline models, training the deep learning model, and evaluating it, returning the performance metric.",
                "main_function_name": "main",
                "score": 0.8117125866979574,
                "pass_rate": 1.0,
                "pass_rate_score": 1.0,
                "prediction_score": 0.0,
                "pylint_score": 0.6759999999999999,
                "radon_score": 0.44112586697957484,
                "test_case_results": {
                    "runnability_check": {
                        "success": true,
                        "reason": null,
                        "message": "code is runnable"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        }
    },
    {
        "0": {
            "code_0": {
                "code": "import pandas as pd\nimport numpy as np\nfrom sklearn.preprocessing import OneHotEncoder, MinMaxScaler\nimport torch\nimport torch.nn as nn\n\n# Component: load_data\ndef load_data(train_path: str, test_path: str):\n    # Load data from the specified Excel files into pandas DataFrames\n    train_df = pd.read_excel(train_path)\n    test_df = pd.read_excel(test_path)\n    return train_df, test_df\n\n# Component: preprocess_data\ndef preprocess_data(df: pd.DataFrame):\n    # Preprocess data: normalize numerical features, one-hot encode categorical features\n    # One-hot encode 'Dominant Wave Direction'\n    encoders = {}\n    ohe = OneHotEncoder(sparse=False)\n    encoded_columns = ohe.fit_transform(df[['Dominant Wave Direction']])\n    encoded_df = pd.DataFrame(encoded_columns, columns=ohe.get_feature_names_out(['Dominant Wave Direction']))\n    \n    # Normalize numerical features\n    numerical_features = df.select_dtypes(include=[np.number]).columns.tolist()\n    numerical_features.remove('x') # We'll keep 'x' as raw for spatial relation possibly\n    numerical_features.remove('y')\n    scaler = MinMaxScaler()\n    df[numerical_features] = scaler.fit_transform(df[numerical_features])\n    \n    # Combine the encoded columns with the original DataFrame\n    processed_df = pd.concat([df, encoded_df], axis=1).drop('Dominant Wave Direction', axis=1)\n    encoders['onehot'] = ohe\n    encoders['scaler'] = scaler\n\n    return processed_df, encoders\n\n# Component: feature_engineering\ndef feature_engineering(df: pd.DataFrame):\n    # Add new features such as wave height multiplied by tidal range\n    df['WaveHeight_TidalRange'] = df['Breaker Wave Height Hb'] * df['Annual Mean Tidal Range']\n    return df\n\n# Component: build_deep_learning_model\nclass BeachProfileModel(nn.Module):\n    def __init__(self, input_size, hidden_size, output_size):\n        super(BeachProfileModel, self).__init__()\n        self.conv1 = nn.Conv1d(1, 16, kernel_size=3, padding=1)\n        self.conv2 = nn.Conv1d(16, 32, kernel_size=3, padding=1)\n        self.fc1 = nn.Linear(32, hidden_size)\n        self.fc2 = nn.Linear(hidden_size, output_size)\n        \n    def forward(self, x):\n        x = torch.relu(self.conv1(x))\n        x = torch.relu(self.conv2(x))\n        x = x.view(x.size(0), -1)  # Flatten the output from conv layer\n        x = torch.relu(self.fc1(x))\n        x = self.fc2(x)\n        return x\n\ndef build_deep_learning_model(input_size: int, hidden_size: int, output_size: int):\n    # Build and return an initialized PyTorch model\n    model = BeachProfileModel(input_size, hidden_size, output_size)\n    return model\n\n# Component: apply_bruun_and_dean_models\ndef apply_bruun_and_dean_models(x_series: pd.Series, empirical_params: list, A_const: float):\n    # Implementing Dean's Model: h(x) = A * x^(2/3)\n    predicted_depths = (A_const * (x_series ** (2/3))).to_numpy()\n    return predicted_depths\n\n# Main integrating function\ndef main():\n    # Load Data\n    train_df, test_df = load_data(\n        \"beach_profile_data/processed_data/beachdata_train.xlsx\",\n        \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n    )\n\n    # Preprocess Data\n    processed_train_df, encoders = preprocess_data(train_df)\n    processed_test_df, _ = preprocess_data(test_df)\n\n    # Feature Engineering\n    engineered_train_df = feature_engineering(processed_train_df)\n    engineered_test_df = feature_engineering(processed_test_df)\n\n    # Assume calculated input size and empirical parameters\n    input_size = engineered_train_df.shape[1] - 1  # total features minus target column 'y'\n    hidden_size = 64  # Example hidden layer size\n    output_size = 1\n    A_const = 0.1  # Hypothetical constant based on Dean's Model, to be tuned/learned\n\n    # Build Model\n    model = build_deep_learning_model(input_size, hidden_size, output_size)\n\n    # Apply Bruun and Dean Models as per requirement\n    predicted_elevations = apply_bruun_and_dean_models(engineered_train_df['x'], [], A_const)\n\n    return model",
                "plan": "1. **load_data**: This function reads training and test data from their respective Excel files into Pandas DataFrames for further processing.\n2. **preprocess_data**: This function one-hot encodes the categorical feature `Dominant Wave Direction` and scales all numerical features except for 'x' and 'y'. We combine this with the original DataFrame to produce the preprocessed data.\n3. **feature_engineering**: This step creates additional features from the existing dataset, such as combining wave height with tidal range, which might have significant effects on beach profile.\n4. **build_deep_learning_model**: Here, we define a PyTorch neural network using convolutional and fully connected layers to model the complexity of spatial and other interactions present in the data.\n5. **apply_bruun_and_dean_models**: We implement Dean's model to predict elevation changes based on the distance variable 'x', using a constant that may be empirically determined.\n6. **main**: This function integrates all components for loading data, preprocessing, feature engineering, building the deep learning model, and applying coastal prediction models. It initializes these processes and outputs the configured PyTorch model.",
                "main_function_name": "main",
                "score": 0.8374300011681571,
                "pass_rate": 1.0,
                "pass_rate_score": 1.0,
                "prediction_score": 0.0,
                "pylint_score": 0.61,
                "radon_score": 0.7643000116815725,
                "test_case_results": {
                    "runnability_check": {
                        "success": true,
                        "reason": null,
                        "message": "code is runnable"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.07692307692307693
                }
            }
        }
    },
    {
        "0": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\nfrom sklearn.preprocessing import OneHotEncoder, StandardScaler\nfrom sklearn.metrics import mean_squared_error\n\n# Component: data_loader\ndef data_loader(train_path, test_path):\n    # Load training and test datasets\n    train_df = pd.read_excel(train_path)\n    test_df = pd.read_excel(test_path)\n    \n    # Return the loaded DataFrames\n    return train_df, test_df\n\n# Component: feature_engineering\ndef feature_engineering(df):\n    # One-hot encode the 'Dominant Wave Direction' categorical feature\n    ohe = OneHotEncoder(sparse=False)\n    wave_directions = ohe.fit_transform(df[['Dominant Wave Direction']])\n    \n    # Standardize numerical features\n    numerical_features = ['x', 'Annual Mean Wave Height']\n    scaler = StandardScaler()\n    scaled_numerics = scaler.fit_transform(df[numerical_features])\n    \n    # Combine transformed features\n    transformed_df = pd.DataFrame(scaled_numerics, columns=numerical_features)\n    wave_directions_df = pd.DataFrame(wave_directions, columns=ohe.get_feature_names_out(['Dominant Wave Direction']))\n    \n    # Concatenate all features\n    final_df = pd.concat([transformed_df, wave_directions_df], axis=1)\n    return final_df\n\n# Component: bruun_model\ndef bruun_model(df):\n    # Assuming a fixed slope, simulate profile change (simplified)\n    slope = 0.01  # Example value\n    sea_level_change = df['x'] * slope\n    return pd.Series(sea_level_change, name='Bruun Prediction')\n\n# Component: dean_model\ndef dean_model(df, A=0.1):\n    # Dean Model prediction\n    dean_prediction = A * (df['x'] ** (2/3))\n    return pd.Series(dean_prediction, name='Dean Prediction')\n\n# Component: deep_learning_model\ndef deep_learning_model(train_df, test_df):\n    class SimpleNN(nn.Module):\n        def __init__(self, input_size, hidden_size, output_size):\n            super(SimpleNN, self).__init__()\n            self.fc1 = nn.Linear(input_size, hidden_size)\n            self.relu = nn.ReLU()\n            self.fc2 = nn.Linear(hidden_size, output_size)\n        \n        def forward(self, x):\n            out = self.fc1(x)\n            out = self.relu(out)\n            out = self.fc2(out)\n            return out\n    \n    # Initialize model, loss function, and optimizer\n    input_size = train_df.shape[1]\n    model = SimpleNN(input_size, 100, 1)\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=0.01)\n    \n    # Convert data to PyTorch tensors\n    X_train = torch.tensor(train_df.values, dtype=torch.float32)\n    y_train = torch.tensor(train_df['y'].values, dtype=torch.float32).view(-1, 1)\n    X_test = torch.tensor(test_df.values, dtype=torch.float32)\n    \n    # Train the model\n    model.train()\n    for epoch in range(500):\n        optimizer.zero_grad()\n        outputs = model(X_train)\n        loss = criterion(outputs, y_train)\n        loss.backward()\n        optimizer.step()\n        \n    # Return the trained model\n    return model\n\n# Component: model_evaluator\ndef model_evaluator(model, test_df):\n    # Prepare test data\n    model.eval()\n    X_test = torch.tensor(test_df.values, dtype=torch.float32)\n    y_true = test_df['y'].values\n    \n    # Predict using the trained model\n    with torch.no_grad():\n        y_pred = model(X_test).numpy().reshape(-1)\n    \n    # Compute RMSE\n    rmse = mean_squared_error(y_true, y_pred, squared=False)\n    return {'RMSE': rmse}\n\n# Main function integrating all components\ndef main():\n    # Paths to the datasets\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n\n    # Execute the workflow\n    train_df, test_df = data_loader(train_path, test_path)\n    engineered_train_df = feature_engineering(train_df)\n    engineered_test_df = feature_engineering(test_df)\n    \n    bruun_predictions = bruun_model(train_df)\n    dean_predictions = dean_model(train_df)\n    \n    model = deep_learning_model(engineered_train_df, engineered_test_df)\n    evaluation_result = model_evaluator(model, engineered_test_df)\n    \n    return evaluation_result",
                "plan": "The code implements a comprehensive process combining traditional coastal models (Bruun and Dean) with a deep learning model to predict changes in coastal elevation. Here is a detailed explanation of each component:\n\n1. **data_loader**: This function reads training and testing datasets from specified Excel files, returning them as pandas DataFrames for ease of manipulation.\n\n2. **feature_engineering**: Categorical data ('Dominant Wave Direction') is one-hot encoded here, while selected numerical features are standardized for consistency. This preprocessing ensures that the data is well-prepared for training the neural network.\n\n3. **bruun_model**: This function simulates coastal profile changes using the Bruun model, mathematically simplified for demonstration. The simulation assumes a constant parameter for slope.\n\n4. **dean_model**: Similar to the Bruun model, this function uses the Dean model to predict equilibrium beach profiles, emphasizing the relation between y as depth and x as distance offshore, with parameter A controlling prediction strength.\n\n5. **deep_learning_model**: A PyTorch-based neural network model is constructed, trained on the preprocessed features to learn complex patterns and predict the target variable ('y'). The model architecture is kept simple for this application but could be extended with further complexity.\n\n6. **model_evaluator**: This function evaluates the trained model using prediction metrics (RMSE) on the test dataset to determine its predictive performance, ensuring that the model can generalize well beyond the training data.\n\nIn the **main** function, each component is executed in sequence, ultimately returning the performance evaluation metrics of the deep learning model.",
                "main_function_name": "main",
                "score": 0.12314270374630851,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.493,
                "radon_score": 0.738427037463085,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 110, in main\n  File \"<string>\", line 26, in feature_engineering\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\frame.py\", line 3902, in __getitem__\n    indexer = self.columns._get_indexer_strict(key, \"columns\")[1]\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\indexes\\base.py\", line 6114, in _get_indexer_strict\n    self._raise_if_missing(keyarr, indexer, axis_name)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\indexes\\base.py\", line 6178, in _raise_if_missing\n    raise KeyError(f\"{not_found} not in index\")\nKeyError: \"['Annual Mean Wave Height'] not in index\"\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.007100591715976331
                }
            }
        },
        "1": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\nfrom sklearn.preprocessing import OneHotEncoder, StandardScaler\nfrom sklearn.metrics import mean_squared_error\n\n# Component: data_loader\ndef data_loader(train_path, test_path):\n    # Load training and test datasets\n    train_df = pd.read_excel(train_path)\n    test_df = pd.read_excel(test_path)\n    return train_df, test_df\n\n# Component: feature_engineering\ndef feature_engineering(df):\n    # One-hot encode the 'Dominant Wave Direction' categorical feature\n    ohe = OneHotEncoder(sparse=False)\n    wave_directions = ohe.fit_transform(df[['Dominant Wave Direction']])\n\n    # Standardize numerical features\n    numerical_features = ['x', 'Breaker Wave Height Hb', 'Deep Water Wave Height Hd']\n    scaler = StandardScaler()\n    scaled_numerics = scaler.fit_transform(df[numerical_features])\n\n    # Combine transformed features\n    transformed_df = pd.DataFrame(scaled_numerics, columns=numerical_features)\n    wave_directions_df = pd.DataFrame(wave_directions, columns=ohe.get_feature_names_out(['Dominant Wave Direction']))\n\n    # Concatenate all features\n    final_df = pd.concat([transformed_df, wave_directions_df], axis=1)\n    return final_df\n\n# Component: bruun_model\ndef bruun_model(df):\n    # Example slope for the Bruun model\n    slope = 0.01\n    sea_level_change = df['x'] * slope\n    return pd.Series(sea_level_change, name='Bruun Prediction')\n\n# Component: dean_model\ndef dean_model(df, A=0.1):\n    dean_prediction = A * (df['x'] ** (2/3))\n    return pd.Series(dean_prediction, name='Dean Prediction')\n\n# Component: deep_learning_model\ndef deep_learning_model(train_df, test_df):\n    class SimpleNN(nn.Module):\n        def __init__(self, input_size, hidden_size, output_size):\n            super(SimpleNN, self).__init__()\n            self.fc1 = nn.Linear(input_size, hidden_size)\n            self.relu = nn.ReLU()\n            self.fc2 = nn.Linear(hidden_size, output_size)\n        \n        def forward(self, x):\n            out = self.fc1(x)\n            out = self.relu(out)\n            out = self.fc2(out)\n            return out\n\n    # Prepare model, loss function, optimizer\n    input_size = train_df.shape[1]\n    model = SimpleNN(input_size, 100, 1)\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=0.01)\n\n    # Convert data to PyTorch tensors\n    X_train = torch.tensor(train_df.values, dtype=torch.float32)\n    y_train = torch.tensor(train_df['y'].values, dtype=torch.float32).view(-1, 1)\n    X_test = torch.tensor(test_df.values, dtype=torch.float32)\n\n    # Train the model\n    model.train()\n    for epoch in range(500):\n        optimizer.zero_grad()\n        outputs = model(X_train)\n        loss = criterion(outputs, y_train)\n        loss.backward()\n        optimizer.step()\n\n    # Return the trained model\n    return model\n\n# Component: model_evaluator\ndef model_evaluator(model, test_df):\n    model.eval()\n    X_test = torch.tensor(test_df.values, dtype=torch.float32)\n    y_true = test_df['y'].values\n\n    with torch.no_grad():\n        y_pred = model(X_test).numpy().reshape(-1)\n\n    rmse = mean_squared_error(y_true, y_pred, squared=False)\n    return {'RMSE': rmse}\n\n# Main function integrating all components\ndef main():\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n\n    train_df, test_df = data_loader(train_path, test_path)\n    engineered_train_df = feature_engineering(train_df)\n    engineered_test_df = feature_engineering(test_df)\n\n    bruun_predictions = bruun_model(train_df)\n    dean_predictions = dean_model(train_df)\n\n    model = deep_learning_model(engineered_train_df, engineered_test_df)\n    evaluation_result = model_evaluator(model, engineered_test_df)\n    \n    return evaluation_result",
                "plan": "1. **Data Loading**: The `data_loader` function reads the training and test datasets using `pandas.read_excel`, returning dataframes for further processing.\n   \n2. **Feature Engineering**: The `feature_engineering` function:\n   - One-hot encodes the 'Dominant Wave Direction', handling categorical data via the `OneHotEncoder`.\n   - Selects and standardizes numerical features related to the coastal profile, such as 'x', 'Breaker Wave Height Hb', 'Deep Water Wave Height Hd'.\n   - Combines both encoded and numerical data into a final dataframe for model input.\n\n3. **Bruun and Dean Models**: \n   - The `bruun_model` function executes a simplified linear model predicting sea-level changes based on distance.\n   - The `dean_model` provides a power-law based prediction, aligning with the Dean model's theoretical structure.\n\n4. **Deep Learning Model**: \n   - Implemented using PyTorch, `SimpleNN` constructs a feed-forward neural network with one hidden layer.\n   - The function compiles and trains this model, outputting predictions for input data.\n\n5. **Model Evaluation**: \n   - Used to compute RMSE for test set predictions compared to true values, thereby appraising model performance.\n\n6. **Main Function**: The `main()` function orchestrates the entire workflow, from data preparation to model evaluation, and returns the evaluation result.",
                "main_function_name": "main",
                "score": 0.13686214106091554,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.658,
                "radon_score": 0.7106214106091552,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\indexes\\base.py\", line 3790, in get_loc\n    return self._engine.get_loc(casted_key)\n  File \"index.pyx\", line 152, in pandas._libs.index.IndexEngine.get_loc\n  File \"index.pyx\", line 181, in pandas._libs.index.IndexEngine.get_loc\n  File \"pandas\\_libs\\hashtable_class_helper.pxi\", line 7080, in pandas._libs.hashtable.PyObjectHashTable.get_item\n  File \"pandas\\_libs\\hashtable_class_helper.pxi\", line 7088, in pandas._libs.hashtable.PyObjectHashTable.get_item\nKeyError: 'y'\n\nThe above exception was the direct cause of the following exception:\n\nTraceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 108, in main\n  File \"<string>\", line 69, in deep_learning_model\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\frame.py\", line 3896, in __getitem__\n    indexer = self.columns.get_loc(key)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\pandas\\core\\indexes\\base.py\", line 3797, in get_loc\n    raise KeyError(key) from err\nKeyError: 'y'\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        },
        "2": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\nfrom sklearn.preprocessing import OneHotEncoder, StandardScaler\nfrom sklearn.metrics import mean_squared_error\n\n# Component: data_loader\ndef data_loader(train_path, test_path):\n    # Load training and test datasets\n    train_df = pd.read_excel(train_path)\n    test_df = pd.read_excel(test_path)\n    return train_df, test_df\n\n# Component: feature_engineering\ndef feature_engineering(df, target_col='y'):\n    # One-hot encode the 'Dominant Wave Direction' categorical feature\n    ohe = OneHotEncoder(sparse=False)\n    wave_directions = ohe.fit_transform(df[['Dominant Wave Direction']])\n\n    # Standardize numerical features\n    numerical_features = ['x', 'Breaker Wave Height Hb', 'Deep Water Wave Height Hd']\n    scaler = StandardScaler()\n    scaled_numerics = scaler.fit_transform(df[numerical_features])\n\n    # Combine transformed features\n    transformed_df = pd.DataFrame(scaled_numerics, columns=numerical_features)\n    wave_directions_df = pd.DataFrame(wave_directions, columns=ohe.get_feature_names_out(['Dominant Wave Direction']))\n\n    # Concatenate all features and retain target column\n    final_df = pd.concat([transformed_df, wave_directions_df, df[[target_col]]], axis=1)\n    return final_df\n\n# Component: bruun_model\ndef bruun_model(df):\n    # Example slope for the Bruun model\n    slope = 0.01\n    sea_level_change = df['x'] * slope\n    return pd.Series(sea_level_change, name='Bruun Prediction')\n\n# Component: dean_model\ndef dean_model(df, A=0.1):\n    dean_prediction = A * (df['x'] ** (2/3))\n    return pd.Series(dean_prediction, name='Dean Prediction')\n\n# Component: deep_learning_model\ndef deep_learning_model(train_df, test_df):\n    class SimpleNN(nn.Module):\n        def __init__(self, input_size, hidden_size, output_size):\n            super(SimpleNN, self).__init__()\n            self.fc1 = nn.Linear(input_size, hidden_size)\n            self.relu = nn.ReLU()\n            self.fc2 = nn.Linear(hidden_size, output_size)\n        \n        def forward(self, x):\n            out = self.fc1(x)\n            out = self.relu(out)\n            out = self.fc2(out)\n            return out\n\n    # Prepare model, loss function, optimizer\n    input_size = train_df.shape[1] - 1  # Subtract 1 for the target column\n    model = SimpleNN(input_size, 100, 1)\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=0.01)\n\n    # Convert data to PyTorch tensors\n    X_train = torch.tensor(train_df.drop(columns='y').values, dtype=torch.float32)\n    y_train = torch.tensor(train_df['y'].values, dtype=torch.float32).view(-1, 1)\n    X_test = torch.tensor(test_df.drop(columns='y').values, dtype=torch.float32)\n\n    # Train the model\n    model.train()\n    for epoch in range(500):\n        optimizer.zero_grad()\n        outputs = model(X_train)\n        loss = criterion(outputs, y_train)\n        loss.backward()\n        optimizer.step()\n\n    # Return the trained model\n    return model\n\n# Component: model_evaluator\ndef model_evaluator(model, test_df):\n    model.eval()\n    X_test = torch.tensor(test_df.drop(columns='y').values, dtype=torch.float32)\n    y_true = test_df['y'].values\n\n    with torch.no_grad():\n        y_pred = model(X_test).numpy().reshape(-1)\n\n    rmse = mean_squared_error(y_true, y_pred, squared=False)\n    return {'RMSE': rmse}\n\n# Main function integrating all components\ndef main():\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n\n    train_df, test_df = data_loader(train_path, test_path)\n    engineered_train_df = feature_engineering(train_df)\n    engineered_test_df = feature_engineering(test_df)\n\n    bruun_predictions = bruun_model(train_df)\n    dean_predictions = dean_model(train_df)\n\n    model = deep_learning_model(engineered_train_df, engineered_test_df)\n    evaluation_result = model_evaluator(model, engineered_test_df)\n    \n    return evaluation_result",
                "plan": "1. Load the training and testing datasets from the specified file paths using `data_loader`.\n2. Perform feature engineering on the data:\n   - One-hot encode the 'Dominant Wave Direction'.\n   - Standardize the selected numerical features.\n   - Retain the target column 'y' in the processed dataframe, ensuring it is available for model training.\n3. Implement the Bruun Model and Dean Model to compute and return predictions based on the respective mathematical models.\n4. Define and train a simple feedforward neural network using PyTorch on the processed data:\n   - The input layer size is determined by the number of features.\n   - The model is trained using the Mean Squared Error loss function and Adam optimizer for 500 epochs.\n5. Evaluate the trained neural network model on the test data:\n   - Predict and calculate the RMSE between the predictions and actual target values in the test data.\n6. Return evaluation metrics (in this case, RMSE) as the output of the main function.\n7. Ensure that all processing steps retain the necessary columns, particularly the 'y' column for model training and evaluation.",
                "main_function_name": "main",
                "score": 0.13663708936529292,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.658,
                "radon_score": 0.7083708936529292,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 109, in main\n  File \"<string>\", line 91, in model_evaluator\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"<string>\", line 56, in forward\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\linear.py\", line 116, in forward\n    return F.linear(input, self.weight, self.bias)\nRuntimeError: mat1 and mat2 shapes cannot be multiplied (242x6 and 7x100)\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        },
        "3": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\nfrom sklearn.preprocessing import OneHotEncoder, StandardScaler\nfrom sklearn.metrics import mean_squared_error\n\n# Component: data_loader\ndef data_loader(train_path, test_path):\n    # Load training and test datasets\n    train_df = pd.read_excel(train_path)\n    test_df = pd.read_excel(test_path)\n    return train_df, test_df\n\n# Component: feature_engineering\ndef feature_engineering(df, target_col='y'):\n    # One-hot encode the 'Dominant Wave Direction' categorical feature\n    ohe = OneHotEncoder(sparse=False)\n    wave_directions = ohe.fit_transform(df[['Dominant Wave Direction']])\n\n    # Standardize numerical features\n    numerical_features = ['x', 'Breaker Wave Height Hb', 'Deep Water Wave Height Hd']\n    scaler = StandardScaler()\n    scaled_numerics = scaler.fit_transform(df[numerical_features])\n\n    # Combine transformed features\n    transformed_df = pd.DataFrame(scaled_numerics, columns=numerical_features)\n    wave_directions_df = pd.DataFrame(wave_directions, columns=ohe.get_feature_names_out(['Dominant Wave Direction']))\n\n    # Concatenate all features and retain target column\n    final_df = pd.concat([transformed_df, wave_directions_df, df[[target_col]]], axis=1)\n    return final_df\n\n# Component: bruun_model\ndef bruun_model(df):\n    # Example slope for the Bruun model\n    slope = 0.01\n    sea_level_change = df['x'] * slope\n    return pd.Series(sea_level_change, name='Bruun Prediction')\n\n# Component: dean_model\ndef dean_model(df, A=0.1):\n    dean_prediction = A * (df['x'] ** (2/3))\n    return pd.Series(dean_prediction, name='Dean Prediction')\n\n# Component: deep_learning_model\ndef deep_learning_model(train_df, test_df):\n    class SimpleNN(nn.Module):\n        def __init__(self, input_size, hidden_size, output_size):\n            super(SimpleNN, self).__init__()\n            self.fc1 = nn.Linear(input_size, hidden_size)\n            self.relu = nn.ReLU()\n            self.fc2 = nn.Linear(hidden_size, output_size)\n        \n        def forward(self, x):\n            out = self.fc1(x)\n            out = self.relu(out)\n            out = self.fc2(out)\n            return out\n\n    # Prepare model, loss function, optimizer\n    input_size = train_df.shape[1] - 1  # Subtract 1 for the target column\n    model = SimpleNN(input_size, 100, 1)\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=0.01)\n\n    # Convert data to PyTorch tensors\n    X_train = torch.tensor(train_df.drop(columns='y').values, dtype=torch.float32)\n    y_train = torch.tensor(train_df['y'].values, dtype=torch.float32).view(-1, 1)\n    X_test = torch.tensor(test_df.drop(columns='y').values, dtype=torch.float32)\n\n    # Train the model\n    model.train()\n    for epoch in range(500):\n        optimizer.zero_grad()\n        outputs = model(X_train)\n        loss = criterion(outputs, y_train)\n        loss.backward()\n        optimizer.step()\n\n    # Return the trained model\n    return model\n\n# Component: model_evaluator\ndef model_evaluator(model, test_df):\n    model.eval()\n    X_test = torch.tensor(test_df.drop(columns='y').values, dtype=torch.float32)\n    y_true = test_df['y'].values\n\n    with torch.no_grad():\n        y_pred = model(X_test).numpy().reshape(-1)\n\n    rmse = mean_squared_error(y_true, y_pred, squared=False)\n    return {'RMSE': rmse}\n\n# Main function integrating all components\ndef main():\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n\n    train_df, test_df = data_loader(train_path, test_path)\n    engineered_train_df = feature_engineering(train_df)\n    engineered_test_df = feature_engineering(test_df)\n\n    bruun_predictions = bruun_model(train_df)\n    dean_predictions = dean_model(train_df)\n\n    model = deep_learning_model(engineered_train_df, engineered_test_df)\n    evaluation_result = model_evaluator(model, engineered_test_df)\n    \n    return evaluation_result",
                "plan": "1. **Data Loading**: The script begins by loading the training and test data sets from the specified Excel file paths using the `pandas` library.\n  \n2. **Feature Engineering**: The categorical column 'Dominant Wave Direction' is one-hot encoded, and several numerical columns are standardized using `StandardScaler`.\n\n3. **Bruun and Dean Models**: Two simple mathematical models, Bruun and Dean, process the distance `x` to generate elevation predictions based on theorized relationships.\n\n4. **Deep Learning Model**: A simple neural network is constructed using PyTorch:\n   - The network consists of a single hidden layer with ReLU activation.\n   - Determines the number of input features dynamically after feature engineering.\n   - The model is trained using mean squared error loss and the Adam optimizer over 500 epochs.\n\n5. **Evaluation**: The model's performance is evaluated using RMSE on the test set.\n\n6. **Integration**: The `main()` function coordinates these components:\n   - Loads data and performs feature engineering.\n   - Makes predictions via the Bruun and Dean models.\n   - Trains and evaluates a deep learning model.\n   \n7. **Output**: The function returns RMSE to assess prediction accuracy.",
                "main_function_name": "main",
                "score": 0.13663708936529292,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.658,
                "radon_score": 0.7083708936529292,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 109, in main\n  File \"<string>\", line 91, in model_evaluator\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"<string>\", line 56, in forward\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1532, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\module.py\", line 1541, in _call_impl\n    return forward_call(*args, **kwargs)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\nn\\modules\\linear.py\", line 116, in forward\n    return F.linear(input, self.weight, self.bias)\nRuntimeError: mat1 and mat2 shapes cannot be multiplied (242x6 and 7x100)\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        },
        "4": {
            "code_0": {
                "code": "import pandas as pd\nimport torch\nimport torch.nn as nn\nimport torch.optim as optim\nfrom sklearn.preprocessing import OneHotEncoder, StandardScaler\nfrom sklearn.metrics import mean_squared_error\n\n# Component: data_loader\ndef data_loader(train_path, test_path):\n    # Load training and test datasets\n    train_df = pd.read_excel(train_path)\n    test_df = pd.read_excel(test_path)\n    return train_df, test_df\n\n# Component: feature_engineering\ndef feature_engineering(df, encoder=None, scaler=None, is_train=True):\n    # One-hot encode the 'Dominant Wave Direction' feature\n    if is_train:\n        ohe = OneHotEncoder(sparse=False)\n        wave_directions = ohe.fit_transform(df[['Dominant Wave Direction']])\n    else:\n        wave_directions = encoder.transform(df[['Dominant Wave Direction']])\n\n    # Standardize numerical features\n    numerical_features = ['x', 'Breaker Wave Height Hb', 'Deep Water Wave Height Hd']\n    if is_train:\n        scaler = StandardScaler()\n        scaled_numerics = scaler.fit_transform(df[numerical_features])\n    else:\n        scaled_numerics = scaler.transform(df[numerical_features])\n\n    # Combine transformed features\n    transformed_df = pd.DataFrame(scaled_numerics, columns=numerical_features)\n    wave_directions_df = pd.DataFrame(wave_directions, columns=ohe.get_feature_names_out(['Dominant Wave Direction']))\n\n    # Concatenate all features and retain target column\n    final_df = pd.concat([transformed_df, wave_directions_df, df[['y']]], axis=1)\n    return final_df, ohe if is_train else None, scaler if is_train else None\n\n# Component: bruun_model\ndef bruun_model(df):\n    # Example slope for the Bruun model\n    slope = 0.01\n    sea_level_change = df['x'] * slope\n    return pd.Series(sea_level_change, name='Bruun Prediction')\n\n# Component: dean_model\ndef dean_model(df, A=0.1):\n    dean_prediction = A * (df['x'] ** (2/3))\n    return pd.Series(dean_prediction, name='Dean Prediction')\n\n# Component: deep_learning_model\ndef deep_learning_model(train_df, test_df):\n    class SimpleNN(nn.Module):\n        def __init__(self, input_size, hidden_size, output_size):\n            super(SimpleNN, self).__init__()\n            self.fc1 = nn.Linear(input_size, hidden_size)\n            self.relu = nn.ReLU()\n            self.fc2 = nn.Linear(hidden_size, output_size)\n        \n        def forward(self, x):\n            out = self.fc1(x)\n            out = self.relu(out)\n            out = self.fc2(out)\n            return out\n\n    # Prepare model, loss function, optimizer\n    input_size = train_df.shape[1] - 1  # Subtract 1 for the target column 'y'\n    model = SimpleNN(input_size, 100, 1)\n    criterion = nn.MSELoss()\n    optimizer = optim.Adam(model.parameters(), lr=0.01)\n\n    # Convert data to PyTorch tensors\n    X_train = torch.tensor(train_df.drop(columns='y').values, dtype=torch.float32)\n    y_train = torch.tensor(train_df['y'].values, dtype=torch.float32).view(-1, 1)\n    X_test = torch.tensor(test_df.drop(columns='y').values, dtype=torch.float32)\n\n    # Train the model\n    model.train()\n    for epoch in range(500):\n        optimizer.zero_grad()\n        outputs = model(X_train)\n        loss = criterion(outputs, y_train)\n        loss.backward()\n        optimizer.step()\n\n    # Return the trained model\n    return model\n\n# Component: model_evaluator\ndef model_evaluator(model, test_df):\n    model.eval()\n    X_test = torch.tensor(test_df.drop(columns='y').values, dtype=torch.float32)\n    y_true = test_df['y'].values\n\n    with torch.no_grad():\n        y_pred = model(X_test).numpy().reshape(-1)\n\n    rmse = mean_squared_error(y_true, y_pred, squared=False)\n    return {'RMSE': rmse}\n\n# Main function integrating all components\ndef main():\n    train_path = \"beach_profile_data/processed_data/beachdata_train.xlsx\"\n    test_path = \"beach_profile_data/processed_data/beachdata_test.xlsx\"\n\n    train_df, test_df = data_loader(train_path, test_path)\n    engineered_train_df, ohe, scaler = feature_engineering(train_df)\n    engineered_test_df, _, _ = feature_engineering(test_df, encoder=ohe, scaler=scaler, is_train=False)\n\n    bruun_predictions = bruun_model(train_df)\n    dean_predictions = dean_model(train_df)\n\n    model = deep_learning_model(engineered_train_df, engineered_test_df)\n    evaluation_result = model_evaluator(model, engineered_test_df)\n    \n    return evaluation_result",
                "plan": "1. **Data Loading**: Load the train and test datasets from Excel files using `pandas.read_excel()`.\n\n2. **Feature Engineering**: \n   - Encode the categorical 'Dominant Wave Direction' using One-Hot Encoding.\n   - Standardize the numerical columns 'x', 'Breaker Wave Height Hb', 'Deep Water Wave Height Hd' using `StandardScaler`.\n   - Ensure that during inference or test, the same encoder and scaler are used to maintain consistency with the training set.\n\n3. **Bruun Model Calculation**:\n   - Implement a simple slope-based calculation using the Bruun Rule.\n\n4. **Dean Model Calculation**:\n   - Implement a power-law expression akin to the Dean Model.\n\n5. **Deep Learning Model**:\n   - Construct a simple feedforward neural network using PyTorch.\n   - Specify the structure with input size matching the number of features after preprocessing.\n   - Train the model on the training data.\n\n6. **Model Evaluation**: \n   - Evaluate the neural network on the test set using RMSE as the metric.\n\n7. **Main Execution**:\n   - Integrate all previous components to manage data flow and evaluate the model, highlighting the prediction's alignment with theoretical models.",
                "main_function_name": "main",
                "score": 0.13513990745348592,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.662,
                "radon_score": 0.6893990745348592,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 109, in main\n  File \"<string>\", line 34, in feature_engineering\nUnboundLocalError: local variable 'ohe' referenced before assignment\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        }
    },
    {
        "0": {
            "code_0": {
                "code": "import os\nimport numpy as np\nimport torch\nimport torch.nn as nn\nimport torch.nn.functional as F\nfrom torch.utils.data import Dataset, DataLoader\nfrom torchvision import transforms\nfrom torchvision.transforms import functional as TF\nfrom PIL import Image\nimport random\nimport copy\nimport matplotlib.pyplot as plt\n\n# ---- Component: load_and_preprocess_dataset ----\n\nclass BrainMRISegmentationDataset(Dataset):\n    \"\"\"\n    Custom PyTorch Dataset for paired brain MRI images and masks.\n    Applies preprocessing and augmentations as defined during initialization.\n    \"\"\"\n    def __init__(self, image_mask_pairs, image_size=256, is_train=False):\n        self.image_mask_pairs = image_mask_pairs\n        self.image_size = image_size\n        self.is_train = is_train\n\n    def __len__(self):\n        return len(self.image_mask_pairs)\n\n    def __getitem__(self, idx):\n        img_path, mask_path = self.image_mask_pairs[idx]\n        # Load image (3-channel) and mask (1-channel), convert to numpy\n        image = Image.open(img_path).convert('RGB')\n        mask = Image.open(mask_path).convert('L')\n        # Convert to numpy arrays\n        image = np.array(image).astype(np.float32)\n        mask = np.array(mask).astype(np.uint8)\n\n        # Ensure mask is binary 0/1\n        mask = (mask > 0).astype(np.float32)\n\n        # Per-image normalization (z-score). Add epsilon to denom to prevent divide-by-zero.\n        img_mean = image.mean()\n        img_std = image.std()\n        image = (image - img_mean) / (img_std + 1e-8)\n\n        # Data augmentation: Only for training!\n        if self.is_train:\n            # Random horizontal/vertical flip\n            if random.random() > 0.5:\n                image = np.flip(image, axis=1).copy()\n                mask = np.flip(mask, axis=1).copy()\n            if random.random() > 0.5:\n                image = np.flip(image, axis=0).copy()\n                mask = np.flip(mask, axis=0).copy()\n            # Random 90-degree rotations\n            rot_k = random.randint(0,3)\n            if rot_k > 0:\n                image = np.rot90(image, k=rot_k, axes=(0,1)).copy()\n                mask = np.rot90(mask,  k=rot_k, axes=(0,1)).copy()\n\n        # Resize both image and mask to target size (image_size, image_size)\n        image = Image.fromarray(np.uint8(((image - image.min())/(image.max()-image.min()+1e-8))*255)) # convert back to 0-255 for resizing\n        image = image.resize((self.image_size, self.image_size), resample=Image.BILINEAR)\n        image = np.array(image).astype(np.float32)\n        # Re-normalize after resizing\n        img_mean = image.mean()\n        img_std = image.std()\n        image = (image - img_mean) / (img_std + 1e-8)\n        mask = Image.fromarray(np.uint8(mask*255))\n        mask = mask.resize((self.image_size, self.image_size), resample=Image.NEAREST)\n        mask = np.array(mask).astype(np.float32) / 255.0\n        mask = (mask > 0.5).astype(np.float32)\n\n        # HWC -> CHW\n        image = np.transpose(image, (2,0,1)) # (3,H,W)\n        mask = np.expand_dims(mask, axis=0)  # (1,H,W)\n\n        return torch.tensor(image, dtype=torch.float32), torch.tensor(mask, dtype=torch.float32)\n\ndef load_and_preprocess_dataset(\n    base_path:str, image_size:int, batch_size:int, num_workers:int,\n    aug_crop_percent:float,  # Not used but kept for compatibility\n    train_val_split:float    # Not used as there are explicit splits\n):\n    \"\"\"\n    Loads images and masks from dataset, builds PyTorch Datasets and DataLoaders.\n    Returns:\n        - dataset_dict: {'train': Dataset, 'val': Dataset, 'test': Dataset}\n        - dataloader_dict: {'train': DataLoader, ...}\n    \"\"\"\n    dataset_dict = {}\n    dataloader_dict = {}\n    for split in ['train', 'val', 'test']:\n        images_dir = os.path.join(base_path, split, \"images\")\n        masks_dir = os.path.join(base_path, split, \"masks\")\n        # All image filenames\n        image_files = [f for f in os.listdir(images_dir) if f.endswith('.tif')]\n        # Match masks to images by filename\n        image_mask_pairs = []\n        for img_fn in image_files:\n            base_name = img_fn[:-4] # remove .tif\n            mask_fn = base_name + '_mask.tif'\n            img_path = os.path.join(images_dir, img_fn)\n            mask_path = os.path.join(masks_dir, mask_fn)\n            if os.path.exists(mask_path):\n                image_mask_pairs.append( (img_path, mask_path) )\n        is_train = (split == 'train')\n        dset = BrainMRISegmentationDataset(\n            image_mask_pairs=image_mask_pairs,\n            image_size=image_size,\n            is_train=is_train\n        )\n        dataset_dict[split] = dset\n        shuffle = True if split=='train' else False\n        drop_last = True if split=='train' else False\n        dataloader = DataLoader(\n            dset, batch_size=batch_size, shuffle=shuffle, num_workers=num_workers, pin_memory=True, drop_last=drop_last\n        )\n        dataloader_dict[split] = dataloader\n    return dataset_dict, dataloader_dict\n\n# ---- Component: UNet ----\n\nclass DoubleConv(nn.Module):\n    \"\"\"\n    (Conv2d-BN-ReLU) * 2 used in every U-Net block\n    \"\"\"\n    def __init__(self, in_ch, out_ch, dropout=0.0):\n        super().__init__()\n        layers = [\n            nn.Conv2d(in_ch, out_ch, kernel_size=3, padding=1, bias=False),\n            nn.BatchNorm2d(out_ch),\n            nn.ReLU(inplace=True),\n            nn.Conv2d(out_ch, out_ch, kernel_size=3, padding=1, bias=False),\n            nn.BatchNorm2d(out_ch),\n            nn.ReLU(inplace=True),\n        ]\n        if dropout > 0:\n            layers.append(nn.Dropout2d(dropout))\n        self.double_conv = nn.Sequential(*layers)\n\n    def forward(self, x):\n        return self.double_conv(x)\n\nclass UNet(nn.Module):\n    \"\"\"\n    2D U-Net for flexible input/output sizes\n    \"\"\"\n    def __init__(self, input_channels, output_channels, dropout=0.1):\n        super(UNet, self).__init__()\n        features = [64, 128, 256, 512, 1024]\n        # Encoder\n        self.inc = DoubleConv(input_channels, features[0], dropout)\n        self.down1 = nn.Sequential(\n                nn.MaxPool2d(2), DoubleConv(features[0], features[1], dropout)\n        )\n        self.down2 = nn.Sequential(\n                nn.MaxPool2d(2), DoubleConv(features[1], features[2], dropout)\n        )\n        self.down3 = nn.Sequential(\n                nn.MaxPool2d(2), DoubleConv(features[2], features[3], dropout)\n        )\n        self.down4 = nn.Sequential(\n                nn.MaxPool2d(2), DoubleConv(features[3], features[4], dropout)\n        )\n        # Decoder\n        self.up1 = nn.ConvTranspose2d(features[4], features[3], kernel_size=2, stride=2)\n        self.conv_up1 = DoubleConv(features[4], features[3], dropout)\n        self.up2 = nn.ConvTranspose2d(features[3], features[2], kernel_size=2, stride=2)\n        self.conv_up2 = DoubleConv(features[3], features[2], dropout)\n        self.up3 = nn.ConvTranspose2d(features[2], features[1], kernel_size=2, stride=2)\n        self.conv_up3 = DoubleConv(features[2], features[1], dropout)\n        self.up4 = nn.ConvTranspose2d(features[1], features[0], kernel_size=2, stride=2)\n        self.conv_up4 = DoubleConv(features[1], features[0], dropout)\n        self.outc = nn.Conv2d(features[0], output_channels, kernel_size=1)\n\n    def forward(self, x):\n        x1 = self.inc(x) # (b,64,H,W)\n        x2 = self.down1(x1) # (b,128,H/2,W/2)\n        x3 = self.down2(x2) # (b,256,H/4,W/4)\n        x4 = self.down3(x3) # (b,512,H/8,W/8)\n        x5 = self.down4(x4) # (b,1024,H/16,W/16)\n\n        u1 = self.up1(x5)\n        u1 = torch.cat([u1, x4], dim=1)\n        u1 = self.conv_up1(u1)\n        u2 = self.up2(u1)\n        u2 = torch.cat([u2, x3], dim=1)\n        u2 = self.conv_up2(u2)\n        u3 = self.up3(u2)\n        u3 = torch.cat([u3, x2], dim=1)\n        u3 = self.conv_up3(u3)\n        u4 = self.up4(u3)\n        u4 = torch.cat([u4, x1], dim=1)\n        u4 = self.conv_up4(u4)\n        out = self.outc(u4)\n        return out\n\n# ---- Component: dice_coefficient ----\n\ndef dice_coefficient(pred_logits:torch.Tensor, gt_mask:torch.Tensor, threshold:float=0.5):\n    \"\"\"\n    Computes Dice coefficient for batched prediction logits and gt_mask.\n    Args:\n        pred_logits: (B,1,H,W), raw logits from model\n        gt_mask: (B,1,H,W) or (B,H,W), float32 0/1\n        threshold: threshold on sigmoid(pred_logits)\n    Returns:\n        dice (float): averaged over batch\n    \"\"\"\n    pred_probs = torch.sigmoid(pred_logits)\n    pred_bin = (pred_probs > threshold).float()\n    gt = gt_mask.float()\n    # Flatten for each sample\n    B = pred_bin.shape[0]\n    dice_scores = []\n    for i in range(B):\n        p = pred_bin[i].view(-1)\n        g = gt[i].view(-1)\n        intersection = (p * g).sum()\n        denom = p.sum() + g.sum()\n        if denom.item() == 0:\n            dice = 1.0  # If both pred and gt are all zero, count as perfect.\n        else:\n            dice = 2.0 * intersection.item() / (denom.item() + 1e-8)\n        dice_scores.append(dice)\n    # Mean over batch\n    return float(np.mean(dice_scores))\n\n# ---- Component: train_segmentation_model ----\n\ndef train_segmentation_model(\n    model, dataset_dict, dataloader_dict, num_epochs:int,\n    learning_rate:float, device:torch.device,\n    patience:int=10, dice_loss_weight:float=0.4\n):\n    \"\"\"\n    Trains U-Net model using BCEWithLogits and Dice losses, validates per epoch.\n    Returns:\n        best_model (nn.Module): Model with best validation Dice.\n        history: list of dicts of loss/metric per epoch.\n    \"\"\"\n    model = model.to(device)\n    optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate)\n    bce_loss_fn = nn.BCEWithLogitsLoss()\n    best_val_dice = -np.inf\n    best_model_wts = copy.deepcopy(model.state_dict())\n    epochs_no_improve = 0\n    history = []\n\n    train_loader = dataloader_dict['train']\n    val_loader = dataloader_dict['val']\n\n    for epoch in range(num_epochs):\n        model.train()\n        train_losses = []\n        train_dice_scores = []\n\n        for imgs, masks in train_loader:\n            imgs = imgs.to(device, non_blocking=True)\n            masks = masks.to(device, non_blocking=True)\n            optimizer.zero_grad()\n            logits = model(imgs)\n            bce = bce_loss_fn(logits, masks)\n            dice = 1.0 - dice_coefficient(logits.detach(), masks.detach())\n            loss = (1-dice_loss_weight)*bce + dice_loss_weight*dice\n            loss.backward()\n            optimizer.step()\n            train_losses.append(loss.item())\n            train_dice_scores.append(1.-dice)\n\n        # Validation\n        model.eval()\n        val_losses = []\n        val_dice_scores = []\n        with torch.no_grad():\n            for imgs, masks in val_loader:\n                imgs = imgs.to(device, non_blocking=True)\n                masks = masks.to(device, non_blocking=True)\n                logits = model(imgs)\n                bce = bce_loss_fn(logits, masks)\n                dice = 1.0 - dice_coefficient(logits, masks)\n                loss = (1-dice_loss_weight)*bce + dice_loss_weight*dice\n                val_losses.append(loss.item())\n                val_dice_scores.append(1.-dice)\n        mean_train_loss = np.mean(train_losses)\n        mean_train_dice = np.mean(train_dice_scores)\n        mean_val_loss = np.mean(val_losses)\n        mean_val_dice = np.mean(val_dice_scores)\n        history.append({\n            'epoch': epoch+1,\n            'train_loss': mean_train_loss,\n            'train_dice': mean_train_dice,\n            'val_loss': mean_val_loss,\n            'val_dice': mean_val_dice\n        })\n        # Early stopping logic\n        if mean_val_dice > best_val_dice + 1e-4:  # improved\n            best_val_dice = mean_val_dice\n            best_model_wts = copy.deepcopy(model.state_dict())\n            epochs_no_improve = 0\n        else:\n            epochs_no_improve += 1\n        if epochs_no_improve >= patience:\n            # Early stop\n            break\n\n    model.load_state_dict(best_model_wts)\n    return model, history\n\n# ---- Component: evaluate_model ----\n\ndef evaluate_model(\n    model, dataset_dict, dataloader_dict, device:torch.device, threshold:float=0.5\n):\n    \"\"\"\n    Evaluates trained model on test set, returns mean Dice.\n    \"\"\"\n    model = model.to(device)\n    model.eval()\n    test_loader = dataloader_dict['test']\n    dice_scores = []\n    with torch.no_grad():\n        for imgs, masks in test_loader:\n            imgs = imgs.to(device, non_blocking=True)\n            masks = masks.to(device, non_blocking=True)\n            logits = model(imgs)\n            dice = dice_coefficient(logits, masks, threshold)\n            dice_scores.append(dice)\n    mean_dice = float(np.mean(dice_scores))\n    return mean_dice\n\n# ---- Component: main ----\n\ndef main():\n    \"\"\"\n    Full end-to-end workflow as required.\n    Returns:\n        model: trained U-Net\n        test_dice: mean Dice score on test set\n    \"\"\"\n    # ---- Set configuration ---\n    DATA_PATH = r\"E:\\python_project_new\\brain_case_study\\lgg-mri-segmentation\\case_study\"\n    IMAGE_SIZE = 256    # resize images to 256x256\n    BATCH_SIZE = 8      # can adjust as per hardware\n    NUM_WORKERS = 2     # adjust if needed\n    NUM_EPOCHS = 40     # can tune\n    LEARNING_RATE = 1e-3\n    PATIENCE = 6\n    DICE_LOSS_WEIGHT = 0.4  # Blend of BCE and Dice loss\n    N_INPUT_CHANNELS = 3\n    N_OUTPUT_CLASSES = 1\n    DROPOUT = 0.1\n    AUG_CROP_PERCENT = 0.0   # not used in this code\n    TRAIN_VAL_SPLIT = 0.0    # not used, explicit split\n\n    device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n\n    # ---- Data Loading & Preprocessing ---\n    dataset_dict, dataloader_dict = load_and_preprocess_dataset(\n        DATA_PATH, IMAGE_SIZE, BATCH_SIZE, NUM_WORKERS, AUG_CROP_PERCENT, TRAIN_VAL_SPLIT\n    )\n\n    # ---- Build model ---\n    model = UNet(N_INPUT_CHANNELS, N_OUTPUT_CLASSES, dropout=DROPOUT)\n\n    # ---- Training ---\n    model, history = train_segmentation_model(\n        model, dataset_dict, dataloader_dict, num_epochs=NUM_EPOCHS,\n        learning_rate=LEARNING_RATE, device=device,\n        patience=PATIENCE, dice_loss_weight=DICE_LOSS_WEIGHT\n    )\n\n    # ---- Evaluation ---\n    test_dice = evaluate_model(\n        model, dataset_dict, dataloader_dict, device=device, threshold=0.5\n    )\n\n    return model, test_dice\n\n# ---- Component: plot_prediction_results ----\n\ndef plot_prediction_results(model, dataset_dict, dataloader_dict, device, n_samples=4):\n    \"\"\"\n    Visualizes results on test set by showing input image, GT mask, and predicted mask.\n    \"\"\"\n    import matplotlib.pyplot as plt\n\n    model = model.to(device)\n    model.eval()\n    test_loader = dataloader_dict['test']\n    shown = 0\n    with torch.no_grad():\n        for imgs, masks in test_loader:\n            imgs = imgs.to(device, non_blocking=True)\n            masks = masks.to(device, non_blocking=True)\n            logits = model(imgs)\n            probs = torch.sigmoid(logits)\n            preds = (probs > 0.5).float()\n            batch = imgs.shape[0]\n            for i in range(batch):\n                if shown >= n_samples:\n                    return\n                image_np = imgs[i].cpu().numpy()\n                # Un-normalize for display (per slice)\n                img_disp = image_np\n                # Keep display in 0-1\n                img_disp = img_disp - img_disp.min()\n                img_disp = img_disp / (img_disp.max()+1e-8)\n                img_disp = np.transpose(img_disp, (1,2,0)) # CHW to HWC\n\n                gt_mask_np = masks[i].cpu().numpy()[0]\n                pred_mask_np = preds[i].cpu().numpy()[0]\n\n                fig, axs = plt.subplots(1,3, figsize=(12,4))\n                axs[0].imshow(img_disp, cmap='gray')\n                axs[0].set_title(\"Input Image\")\n                axs[0].axis('off')\n                axs[1].imshow(gt_mask_np, cmap='Reds', alpha=0.7)\n                axs[1].set_title(\"Ground Truth Mask\")\n                axs[1].axis('off')\n                axs[2].imshow(img_disp, cmap='gray')\n                axs[2].imshow(pred_mask_np, cmap='winter', alpha=0.5)\n                axs[2].set_title(\"Predicted Mask Overlay\")\n                axs[2].axis('off')\n                plt.tight_layout()\n                plt.show()\n                shown += 1",
                "plan": "Step-by-step explanation of the code's workflow:\n\n1. **Data Loading and Preprocessing:**\n   - Using `load_and_preprocess_dataset`, the function navigates the dataset structure, matching 3-channel .tif images with their corresponding 1-channel mask .tif files by filename conventions.\n   - A custom PyTorch `Dataset` (`BrainMRISegmentationDataset`) loads these pairs, applies:\n     - Per-image z-score normalization,\n     - Random flips and rotations for training augmentation,\n     - Resizing both image and mask to a uniform `image_size` (default 256x256). Images are always kept 3-channel, masks as 1-channel binary.\n   - Datasets split into train, val, test; respective DataLoaders are created for batching.\n\n2. **Model Definition (U-Net):**\n   - Defines a U-Net architecture for 2D segmentation, using double convolution blocks with batch normalization and dropout (configurable).\n   - Flexible for input channels (default 3, pseudo-RGB) and output classes (default 1 for binary).\n\n3. **Dice Coefficient Calculation:**\n   - Implements a function to compute the Dice score between predicted and ground truth masks, ensuring correct thresholding/binarization and robust to all-zero cases (returns 1 if both empty).\n\n4. **Training Procedure:**\n   - `train_segmentation_model` handles the main epoch loop:\n     - Each epoch: model trains on batches from the train loader, minimizing a combined BCEWithLogitsLoss and (1-Dice) loss (weighted sum).\n     - Per-epoch validation computes mean loss and mean validation Dice.\n     - Early stopping based on validation Dice, saving the best weights.\n\n5. **Model Evaluation:**\n   - Uses `evaluate_model` to compute the average Dice score across the test set's images.\n\n6. **Main Pipeline (`main`):**\n   - Top-level configuration (filepaths, sizes, learning parameters, device).\n   - Loads data, instantiates the U-Net, trains, evaluates on the test set, and returns both the trained model and mean test Dice.\n\n7. **Visualization:**\n   - `plot_prediction_results` helps qualitative evaluation of predictions, showing test input image, ground truth, and overlayed predictions for a sample of images.\n\nAll critical paths (data, model, training, evaluation, visualization) are modular and support full reproducibility and quick adaptation to changes in configuration or experimental setup.",
                "main_function_name": "main",
                "score": 0.12529366902017822,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.773,
                "radon_score": 0.4799366902017821,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 368, in main\n  File \"<string>\", line 259, in train_segmentation_model\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\utils\\data\\dataloader.py\", line 439, in __iter__\n    return self._get_iterator()\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\utils\\data\\dataloader.py\", line 387, in _get_iterator\n    return _MultiProcessingDataLoaderIter(self)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\utils\\data\\dataloader.py\", line 1040, in __init__\n    w.start()\n  File \"d:\\anaconda3\\envs\\llm\\lib\\multiprocessing\\process.py\", line 121, in start\n    self._popen = self._Popen(self)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\multiprocessing\\context.py\", line 224, in _Popen\n    return _default_context.get_context().Process._Popen(process_obj)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\multiprocessing\\context.py\", line 327, in _Popen\n    return Popen(process_obj)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\multiprocessing\\popen_spawn_win32.py\", line 93, in __init__\n    reduction.dump(process_obj, to_child)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\multiprocessing\\reduction.py\", line 60, in dump\n    ForkingPickler(file, protocol).dump(obj)\n_pickle.PicklingError: Can't pickle <class 'BrainMRISegmentationDataset'>: attribute lookup BrainMRISegmentationDataset on builtins failed\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.007100591715976331
                }
            }
        },
        "1": {
            "code_0": {
                "code": "import os\nimport numpy as np\nimport torch\nimport torch.nn as nn\nimport torch.nn.functional as F\nfrom torch.utils.data import Dataset, DataLoader\nfrom PIL import Image\nimport random\nimport copy\nimport matplotlib.pyplot as plt\n\n# ========== Helper Classes and Functions: must be defined at global level! ==========\n\nclass BrainMRISegmentationDataset(Dataset):\n    \"\"\"\n    PyTorch Dataset for FLAIR brain MRI and binary masks.\n    Handles per-image normalization, resizing, augmentation.\n    \"\"\"\n    def __init__(self, image_mask_pairs, image_size=256, is_train=False):\n        super().__init__()\n        self.image_mask_pairs = image_mask_pairs  # List of (img_path, mask_path)\n        self.image_size = image_size\n        self.is_train = is_train\n\n    def __len__(self):\n        return len(self.image_mask_pairs)\n\n    def __getitem__(self, idx):\n        img_path, mask_path = self.image_mask_pairs[idx]\n        \n        # Load and preprocess image (as RGB)\n        image = Image.open(img_path).convert('RGB')\n        # Load and preprocess mask (as L for 1-channel)\n        mask = Image.open(mask_path).convert('L')\n        \n        # Convert to np arrays (image: float32, mask: uint8)\n        image = np.array(image).astype(np.float32)\n        mask = np.array(mask).astype(np.uint8)\n        \n        # Ensure mask is binary (0/1)\n        mask = (mask > 0).astype(np.float32)\n        \n        # Per-image z-score normalization (channel-wise)\n        img_mean = image.mean()\n        img_std = image.std()\n        image = (image - img_mean) / (img_std + 1e-8)\n        \n        # Data augmentation (train only, apply same to mask)\n        if self.is_train:\n            if random.random() > 0.5:  # Horizontal flip\n                image = np.flip(image, axis=1)\n                mask = np.flip(mask, axis=1)\n            if random.random() > 0.5:  # Vertical flip\n                image = np.flip(image, axis=0)\n                mask = np.flip(mask, axis=0)\n            # Random rotate 90/180/270/none\n            if random.random() > 0.5:\n                k = random.choice([1, 2, 3])\n                image = np.rot90(image, k, axes=(0, 1))\n                mask = np.rot90(mask, k, axes=(0, 1))\n        \n        # Resize both to uniform size\n        # For image: use bilinear, mask: nearest\n        image = Image.fromarray(((image - image.min()) / (image.max() - image.min() + 1e-8) * 255).astype(np.uint8))\n        image = image.resize((self.image_size, self.image_size), resample=Image.BILINEAR)\n        image = np.array(image).astype(np.float32)\n        # Per-image z-score again after resize (for better numeric stability)\n        img_mean = image.mean()\n        img_std = image.std()\n        image = (image - img_mean) / (img_std + 1e-8)\n\n        mask = Image.fromarray((mask * 255).astype(np.uint8))\n        mask = mask.resize((self.image_size, self.image_size), resample=Image.NEAREST)\n        mask = np.array(mask).astype(np.float32)\n        mask = (mask > 127).astype(np.float32)\n\n        # HWC -> CHW for image, (H, W) -> (1, H, W) for mask\n        image = np.transpose(image, (2, 0, 1))  # (3,H,W)\n        mask = mask[None, :, :]  # (1,H,W)\n        \n        # Convert to tensor\n        return torch.from_numpy(image).float(), torch.from_numpy(mask).float()\n\ndef create_image_mask_pairs(images_dir, masks_dir):\n    \"\"\"\n    Returns matched (image_path, mask_path) pairs, ensuring mask exists.\n    \"\"\"\n    image_files = [f for f in os.listdir(images_dir) if f.endswith('.tif')]\n    pairs = []\n    for img_file in image_files:\n        base = img_file[:-4]\n        mask_file = f\"{base}_mask.tif\"\n        img_path = os.path.join(images_dir, img_file)\n        mask_path = os.path.join(masks_dir, mask_file)\n        if os.path.exists(mask_path):\n            pairs.append((img_path, mask_path))\n    return pairs\n\ndef load_and_preprocess_dataset(base_path: str, image_size: int, batch_size: int, num_workers: int=0):\n    \"\"\"\n    Loads and preprocesses data into PyTorch DataLoaders for train/val/test.\n    Returns:\n        dataset_dict: {split: Dataset}\n        dataloader_dict: {split: DataLoader}\n    \"\"\"\n    splits = ['train', 'val', 'test']\n    dataset_dict = {}\n    dataloader_dict = {}\n    for split in splits:\n        images_dir = os.path.join(base_path, split, \"images\")\n        masks_dir = os.path.join(base_path, split, \"masks\")\n        pairs = create_image_mask_pairs(images_dir, masks_dir)\n        is_train = split == 'train'\n        dataset = BrainMRISegmentationDataset(pairs, image_size=image_size, is_train=is_train)\n        shuffle = is_train\n        # num_workers=0 for maximum Windows/compatibility robustness (no pickle issues)\n        loader = DataLoader(dataset, batch_size=batch_size, shuffle=shuffle, num_workers=num_workers, pin_memory=True, drop_last=False)\n        dataset_dict[split] = dataset\n        dataloader_dict[split] = loader\n    return dataset_dict, dataloader_dict\n\nclass DoubleConv(nn.Module):\n    \"\"\"\n    Two (Conv2d -> BN -> ReLU) operations as a single block (used in U-Net).\n    \"\"\"\n    def __init__(self, in_ch, out_ch, dropout=0.0):\n        super().__init__()\n        layers = [\n            nn.Conv2d(in_ch, out_ch, kernel_size=3, padding=1, bias=False),\n            nn.BatchNorm2d(out_ch),\n            nn.ReLU(inplace=True),\n            nn.Conv2d(out_ch, out_ch, kernel_size=3, padding=1, bias=False),\n            nn.BatchNorm2d(out_ch),\n            nn.ReLU(inplace=True)\n        ]\n        if dropout > 0:\n            layers.append(nn.Dropout2d(dropout))\n        self.block = nn.Sequential(*layers)\n    def forward(self, x):\n        return self.block(x)\n\nclass UNet(nn.Module):\n    \"\"\"\n    Standard 2D U-Net implementation for semantic segmentation.\n    \"\"\"\n    def __init__(self, in_channels=3, out_channels=1, dropout=0.1):\n        super().__init__()\n        chs = [64, 128, 256, 512, 1024]\n        # Encoder\n        self.inc = DoubleConv(in_channels, chs[0], dropout)\n        self.down1 = nn.Sequential(nn.MaxPool2d(2), DoubleConv(chs[0], chs[1], dropout))\n        self.down2 = nn.Sequential(nn.MaxPool2d(2), DoubleConv(chs[1], chs[2], dropout))\n        self.down3 = nn.Sequential(nn.MaxPool2d(2), DoubleConv(chs[2], chs[3], dropout))\n        self.down4 = nn.Sequential(nn.MaxPool2d(2), DoubleConv(chs[3], chs[4], dropout))\n        # Decoder\n        self.up1 = nn.ConvTranspose2d(chs[4], chs[3], 2, stride=2)\n        self.conv1 = DoubleConv(chs[4], chs[3], dropout)\n        self.up2 = nn.ConvTranspose2d(chs[3], chs[2], 2, stride=2)\n        self.conv2 = DoubleConv(chs[3], chs[2], dropout)\n        self.up3 = nn.ConvTranspose2d(chs[2], chs[1], 2, stride=2)\n        self.conv3 = DoubleConv(chs[2], chs[1], dropout)\n        self.up4 = nn.ConvTranspose2d(chs[1], chs[0], 2, stride=2)\n        self.conv4 = DoubleConv(chs[1], chs[0], dropout)\n        self.outc = nn.Conv2d(chs[0], out_channels, kernel_size=1)\n    def forward(self, x):\n        x1 = self.inc(x)    # (B,64,H,W)\n        x2 = self.down1(x1) # (B,128,H/2,W/2)\n        x3 = self.down2(x2) # (B,256,H/4,W/4)\n        x4 = self.down3(x3) # (B,512,H/8,W/8)\n        x5 = self.down4(x4) # (B,1024,H/16,W/16)\n\n        u1 = self.up1(x5)\n        u1 = torch.cat([u1, x4], dim=1)\n        u1 = self.conv1(u1)\n        u2 = self.up2(u1)\n        u2 = torch.cat([u2, x3], dim=1)\n        u2 = self.conv2(u2)\n        u3 = self.up3(u2)\n        u3 = torch.cat([u3, x2], dim=1)\n        u3 = self.conv3(u3)\n        u4 = self.up4(u3)\n        u4 = torch.cat([u4, x1], dim=1)\n        u4 = self.conv4(u4)\n        out = self.outc(u4)\n        return out\n\ndef dice_coefficient(pred_logits: torch.Tensor, gt_mask: torch.Tensor, threshold: float=0.5):\n    \"\"\"\n    Computes the Dice coefficient for binary segmentation (element-wise).\n    pred_logits: raw logits from model, (B,1,H,W)\n    gt_mask: ground truth mask, (B,1,H,W)\n    threshold: sigmoid(logits) > threshold -> foreground.\n    Returns: average Dice across batch (float).\n    \"\"\"\n    prob = torch.sigmoid(pred_logits)\n    pred = (prob > threshold).float()\n    gt = (gt_mask > 0.5).float()\n    batch = pred.shape[0]\n    dices = []\n    for i in range(batch):\n        pi = pred[i].view(-1)\n        gi = gt[i].view(-1)\n        intersection = (pi * gi).sum()\n        denom = pi.sum() + gi.sum()\n        if denom == 0:\n            dices.append(1.0)  # If both empty, count as perfect!\n        else:\n            dices.append(float(2. * intersection / (denom + 1e-8)))\n    return float(np.mean(dices))\n\ndef train_segmentation_model(model, dataset_dict, dataloader_dict, num_epochs: int, learning_rate: float,\n                            device: torch.device, patience: int=8, dice_loss_weight: float=0.4):\n    \"\"\"\n    Trains the U-Net with BCEWithLogitsLoss + Dice loss. Early stop on best val Dice.\n    \"\"\"\n    model = model.to(device)\n    optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate)\n    bce_loss_fn = nn.BCEWithLogitsLoss()\n    best_val_dice = -np.inf\n    best_state = copy.deepcopy(model.state_dict())\n    epochs_no_improve = 0\n    history = []\n\n    for epoch in range(num_epochs):\n        model.train()\n        epoch_loss = []\n        epoch_dice = []\n        for img, msk in dataloader_dict['train']:\n            img = img.to(device)\n            msk = msk.to(device)\n            optimizer.zero_grad()\n            out = model(img)\n            bce = bce_loss_fn(out, msk)\n            dice = 1 - dice_coefficient(out.detach(), msk.detach())\n            loss = (1-dice_loss_weight)*bce + dice_loss_weight * dice\n            loss.backward()\n            optimizer.step()\n            epoch_loss.append(loss.item())\n            epoch_dice.append(1-dice)\n\n        # Validation\n        model.eval()\n        val_loss = []\n        val_dice = []\n        with torch.no_grad():\n            for img, msk in dataloader_dict['val']:\n                img = img.to(device)\n                msk = msk.to(device)\n                out = model(img)\n                bce = bce_loss_fn(out, msk)\n                dice = 1 - dice_coefficient(out, msk)\n                vloss = (1-dice_loss_weight)*bce + dice_loss_weight*dice\n                val_loss.append(vloss.item())\n                val_dice.append(1-dice)\n        mean_val_dice = np.mean(val_dice)\n        if mean_val_dice > best_val_dice + 1e-5:\n            best_val_dice = mean_val_dice\n            best_state = copy.deepcopy(model.state_dict())\n            epochs_no_improve = 0\n        else:\n            epochs_no_improve += 1\n        history.append({\n            'epoch': epoch+1,\n            'train_loss': np.mean(epoch_loss),\n            'train_dice': np.mean(epoch_dice),\n            'val_loss': np.mean(val_loss),\n            'val_dice': mean_val_dice\n        })\n        # Early stopping\n        if epochs_no_improve >= patience:\n            break\n    model.load_state_dict(best_state)\n    return model, history\n\ndef evaluate_model(model, dataset_dict, dataloader_dict, device, threshold=0.5):\n    \"\"\"\n    Evaluates the trained model on test set. Returns mean Dice score.\n    \"\"\"\n    model = model.to(device)\n    model.eval()\n    dices = []\n    with torch.no_grad():\n        for img, msk in dataloader_dict['test']:\n            img = img.to(device)\n            msk = msk.to(device)\n            out = model(img)\n            dice = dice_coefficient(out, msk, threshold)\n            dices.append(dice)\n    return float(np.mean(dices))\n\ndef plot_prediction_results(model, dataset_dict, dataloader_dict, device, n_samples=4):\n    \"\"\"\n    Display several segmentation predictions (image, gt, pred) from test set.\n    \"\"\"\n    model = model.to(device)\n    model.eval()\n    shown = 0\n    with torch.no_grad():\n        for img, msk in dataloader_dict['test']:\n            img = img.to(device)\n            msk = msk.to(device)\n            out = model(img)\n            prob = torch.sigmoid(out)\n            pred = (prob > 0.5).float()\n            batch = img.shape[0]\n            for i in range(batch):\n                if shown >= n_samples:\n                    return\n                # Prepare display\n                # Undo normalization: scale input to (0,1)\n                npimg = img[i].cpu().numpy()\n                npimg_disp = npimg - npimg.min()\n                npimg_disp = npimg_disp / (npimg_disp.max() + 1e-8)\n                npimg_disp = np.transpose(npimg_disp, (1,2,0))  # HWC\n                gt_mask = msk[i,0].cpu().numpy()\n                pred_mask = pred[i,0].cpu().numpy()\n                fig, axs = plt.subplots(1,3, figsize=(12,4))\n                axs[0].imshow(npimg_disp, cmap='gray')\n                axs[0].set_title('Input Image')\n                axs[0].axis('off')\n                axs[1].imshow(gt_mask, cmap='Reds', interpolation='none')\n                axs[1].set_title('Ground Truth Mask')\n                axs[1].axis('off')\n                axs[2].imshow(npimg_disp, cmap='gray')\n                axs[2].imshow(pred_mask, cmap='winter', alpha=0.5)\n                axs[2].set_title('Predicted Mask Overlay')\n                axs[2].axis('off')\n                plt.tight_layout()\n                plt.show()\n                shown += 1\n\n# ========== Main entrypoint function ==========\n\ndef main():\n    \"\"\"\n    MAIN FUNCTION: Load data, train model, evaluate test dice, and return model + test dice.\n    Returns:\n        model (trained UNet)\n        test_dice (float): mean Dice coefficient on the test set\n    \"\"\"\n    # --- Configuration ---\n    DATA_PATH = r\"E:\\python_project_new\\brain_case_study\\lgg-mri-segmentation\\case_study\"\n    IMAGE_SIZE = 256\n    BATCH_SIZE = 8\n    NUM_EPOCHS = 40\n    LEARNING_RATE = 1e-3\n    PATIENCE = 6\n    DICE_LOSS_WEIGHT = 0.4\n    N_INPUT_CHANNELS = 3\n    N_OUTPUT_CLASSES = 1\n    DROPOUT = 0.1\n    NUM_WORKERS = 0  # Crucial for Windows/pickling compatibility\n\n    # --- Device ---\n    device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n\n    # --- Load data ---\n    dataset_dict, dataloader_dict = load_and_preprocess_dataset(\n        DATA_PATH, IMAGE_SIZE, BATCH_SIZE, num_workers=NUM_WORKERS\n    )\n\n    # --- Build model ---\n    model = UNet(N_INPUT_CHANNELS, N_OUTPUT_CLASSES, dropout=DROPOUT)\n\n    # --- Train model ---\n    model, history = train_segmentation_model(\n        model, dataset_dict, dataloader_dict,\n        num_epochs=NUM_EPOCHS, learning_rate=LEARNING_RATE,\n        device=device, patience=PATIENCE,\n        dice_loss_weight=DICE_LOSS_WEIGHT\n    )\n\n    # --- Evaluate test dice ---\n    test_dice = evaluate_model(\n        model, dataset_dict, dataloader_dict, device, threshold=0.5\n    )\n\n    return model, test_dice",
                "plan": "1. **Dataset & Preprocessing**: \n    - The dataset class loads each image and its corresponding mask pair, normalizes intensity using z-score, binarizes masks, resizes both, and applies data augmentation (flip/rotate) during training. All conversions to torch tensors and required shape changes are handled.\n    - The loader function scans each split's directory for image/mask pairs, uses batch loaders, and crucially sets `num_workers=0` to avoid pickling errors, ensuring compatibility on all platforms/environments.\n\n2. **Model Definition**: \n    - A classic U-Net model (encoder-decoder with skip connections, batchnorm, dropout) is implemented with flexibility for dropout and channel numbers.\n    - DoubleConv blocks are used for repeated Conv-BN-ReLU stacks.\n\n3. **Training Pipeline**:\n    - The training function combines BCEWithLogitsLoss (robust for binary segmentation) and Dice loss, using early stopping monitored via the validation Dice.\n    - The best model (by validation) is retained and reloaded at the end before returning.\n\n4. **Evaluation**:\n    - The evaluation function computes the averaged Dice coefficient over the whole test set using sigmoid-thresholded logits.\n\n5. **Visualization**:\n    - The visualization/plotting function draws N sample predictions from the test set: It shows the input image, ground truth, and predicted mask overlay for fast visual quality checking.\n\n6. **Main Pipeline (`main` function)**:\n    - Sets all hyperparameters/configs.\n    - Loads data and applies full preprocessing.\n    - Builds model.\n    - Trains with early stopping.\n    - Evaluates on test set, returning trained model and test dice value.\n\n**All classes and functions are defined at the global level to ensure maximum compatibility with PyTorch DataLoader and multiprocessing, avoiding pickling errors.**",
                "main_function_name": "main",
                "score": 0.12806891234678547,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.798,
                "radon_score": 0.4826891234678544,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "timeout",
                        "message": "Process did not finish within the allowed time"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.00109239872553482
                }
            }
        },
        "2": {
            "code_0": {
                "code": "import os\nimport numpy as np\nimport torch\nimport torch.nn as nn\nimport torch.nn.functional as F\nfrom torch.utils.data import Dataset, DataLoader\nfrom PIL import Image\nimport random\nimport copy\nimport matplotlib.pyplot as plt\n\n# ------- Dataset Class --------\nclass BrainMRISegmentationDataset(Dataset):\n    \"\"\"\n    Custom PyTorch Dataset for loading pairs of brain MRI slices and corresponding masks.\n    Handles per-image normalization, resizing, and (optionally) augmentation.\n    \"\"\"\n    def __init__(\n        self,\n        pairs,\n        image_size=128,\n        is_train=False,\n        augment_prob=0.5\n    ):\n        self.pairs = pairs\n        self.image_size = image_size\n        self.is_train = is_train\n        self.augment_prob = augment_prob\n\n    def __len__(self):\n        return len(self.pairs)\n\n    def __getitem__(self, idx):\n        img_path, mask_path = self.pairs[idx]\n        # Load image (as RGB)\n        image = Image.open(img_path).convert('RGB')\n        # Load mask (as single channel)\n        mask = Image.open(mask_path).convert('L')\n\n        # Convert to numpy\n        image = np.array(image).astype(np.float32)\n        mask = np.array(mask).astype(np.uint8)\n\n        # Ensure binary mask [0,1]\n        mask = (mask > 0).astype(np.float32)\n\n        # Per-image normalization (z-score for all channels)\n        img_mean = image.mean()\n        img_std = image.std()\n        if img_std < 1e-6: img_std = 1.0\n        image = (image - img_mean) / img_std\n\n        # Data augmentation for training\n        if self.is_train:\n            # Horizontal flip\n            if random.random() < self.augment_prob:\n                image = np.flip(image, axis=1)\n                mask = np.flip(mask, axis=1)\n            # Vertical flip\n            if random.random() < self.augment_prob:\n                image = np.flip(image, axis=0)\n                mask = np.flip(mask, axis=0)\n            # Random rotation\n            if random.random() < self.augment_prob:\n                k = random.choice([1, 2, 3])  # 90,180,270 degrees\n                image = np.rot90(image, k, axes=(0, 1))\n                mask = np.rot90(mask, k, axes=(0, 1))\n\n        # Resize: for images, use bilinear; for masks, use nearest\n        image = Image.fromarray(\n            np.clip(\n                (((image - image.min()) / (image.max() - image.min() + 1e-8)) * 255),\n                0, 255).astype(np.uint8)\n        ).resize((self.image_size, self.image_size), Image.BILINEAR)\n        image = np.array(image).astype(np.float32)\n        # After resize: normalization again (for safety)\n        img_mean = image.mean()\n        img_std = image.std()\n        image = (image - img_mean) / (img_std + 1e-8)\n\n        mask = Image.fromarray((mask * 255).astype(np.uint8))\n        mask = mask.resize((self.image_size, self.image_size), Image.NEAREST)\n        mask = np.array(mask).astype(np.float32)\n        mask = (mask > 127).astype(np.float32)\n\n        # HWC -> CHW\n        if image.ndim == 2:\n            image = np.stack([image, image, image], axis=2)\n        image = np.transpose(image, (2, 0, 1))  # (3,H,W)\n        mask = mask[None, :, :]  # (1,H,W)\n\n        return torch.from_numpy(image).float(), torch.from_numpy(mask).float()\n\ndef create_pairs(images_dir, masks_dir, max_samples=None):\n    \"\"\"\n    Get list of (image_path, mask_path) pairs. Limit to max_samples if set.\n    \"\"\"\n    image_files = [f for f in os.listdir(images_dir) if f.endswith('.tif')]\n    pairs = []\n    for fname in image_files:\n        base = fname[:-4]\n        mask_fname = f\"{base}_mask.tif\"\n        img_path = os.path.join(images_dir, fname)\n        mask_path = os.path.join(masks_dir, mask_fname)\n        if os.path.exists(mask_path):\n            pairs.append((img_path, mask_path))\n    # Optionally shuffle and subsample\n    random.shuffle(pairs)\n    if max_samples is not None:\n        pairs = pairs[:max_samples]\n    return pairs\n\ndef load_datasets(\n    base_path, image_size=128, batch_size=4, num_workers=0, max_train=100, max_val=20, max_test=20\n):\n    \"\"\"\n    Load datasets and DataLoaders for train/val/test sets.\n    \"\"\"\n    splits = ['train', 'val', 'test']\n    max_by_split = {'train': max_train, 'val': max_val, 'test': max_test}\n    dataset_dict = {}\n    dataloader_dict = {}\n    for split in splits:\n        img_dir = os.path.join(base_path, split, 'images')\n        mask_dir = os.path.join(base_path, split, 'masks')\n        max_samples = max_by_split[split]\n        pairs = create_pairs(img_dir, mask_dir, max_samples=max_samples)\n        is_train = (split == 'train')\n        dataset = BrainMRISegmentationDataset(pairs, image_size=image_size, is_train=is_train)\n        shuffle = is_train\n        loader = DataLoader(dataset, batch_size=batch_size, shuffle=shuffle, num_workers=num_workers, pin_memory=False)\n        dataset_dict[split] = dataset\n        dataloader_dict[split] = loader\n    return dataset_dict, dataloader_dict\n\n# ------- UNet model (Lightweight) --------\nclass DoubleConv(nn.Module):\n    \"\"\"(Conv2d -> BN -> ReLU) * 2\"\"\"\n    def __init__(self, in_ch, out_ch):\n        super().__init__()\n        self.double_conv = nn.Sequential(\n            nn.Conv2d(in_ch, out_ch, kernel_size=3, padding=1, bias=False),\n            nn.BatchNorm2d(out_ch),\n            nn.ReLU(inplace=True),\n            nn.Conv2d(out_ch, out_ch, kernel_size=3, padding=1, bias=False),\n            nn.BatchNorm2d(out_ch),\n            nn.ReLU(inplace=True)\n        )\n    def forward(self, x):\n        return self.double_conv(x)\n\nclass UNetLite(nn.Module):\n    \"\"\"Lightweight U-Net for 2D segmentation\"\"\"\n    def __init__(self, in_ch=3, out_ch=1):\n        super().__init__()\n        chs = [16, 32, 64, 128, 256]\n        # Encoder\n        self.inc = DoubleConv(in_ch, chs[0])\n        self.down1 = nn.Sequential(nn.MaxPool2d(2), DoubleConv(chs[0], chs[1]))\n        self.down2 = nn.Sequential(nn.MaxPool2d(2), DoubleConv(chs[1], chs[2]))\n        self.down3 = nn.Sequential(nn.MaxPool2d(2), DoubleConv(chs[2], chs[3]))\n        self.down4 = nn.Sequential(nn.MaxPool2d(2), DoubleConv(chs[3], chs[4]))\n        # Decoder\n        self.up1 = nn.ConvTranspose2d(chs[4], chs[3], kernel_size=2, stride=2)\n        self.conv1 = DoubleConv(chs[4], chs[3])\n        self.up2 = nn.ConvTranspose2d(chs[3], chs[2], kernel_size=2, stride=2)\n        self.conv2 = DoubleConv(chs[3], chs[2])\n        self.up3 = nn.ConvTranspose2d(chs[2], chs[1], kernel_size=2, stride=2)\n        self.conv3 = DoubleConv(chs[2], chs[1])\n        self.up4 = nn.ConvTranspose2d(chs[1], chs[0], kernel_size=2, stride=2)\n        self.conv4 = DoubleConv(chs[1], chs[0])\n        self.outc = nn.Conv2d(chs[0], out_ch, kernel_size=1)\n    def forward(self, x):\n        x1 = self.inc(x)\n        x2 = self.down1(x1)\n        x3 = self.down2(x2)\n        x4 = self.down3(x3)\n        x5 = self.down4(x4)\n        u1 = self.up1(x5)\n        u1 = torch.cat([u1, x4], dim=1)\n        u1 = self.conv1(u1)\n        u2 = self.up2(u1)\n        u2 = torch.cat([u2, x3], dim=1)\n        u2 = self.conv2(u2)\n        u3 = self.up3(u2)\n        u3 = torch.cat([u3, x2], dim=1)\n        u3 = self.conv3(u3)\n        u4 = self.up4(u3)\n        u4 = torch.cat([u4, x1], dim=1)\n        u4 = self.conv4(u4)\n        return self.outc(u4)\n\n# ------- Dice Coefficient --------\ndef dice_coefficient(pred_logits, target, threshold=0.5, eps=1e-7):\n    \"\"\"\n    pred_logits: model output, shape (B,1,H,W)\n    target: ground truth, shape (B,1,H,W)\n    Returns: average Dice over batch\n    \"\"\"\n    pred = torch.sigmoid(pred_logits)\n    pred = (pred > threshold).float()\n    target = (target > 0.5).float()\n    intersection = (pred * target).sum(dim=(2, 3))\n    unionset = pred.sum(dim=(2, 3)) + target.sum(dim=(2, 3))\n    dice = (2 * intersection + eps) / (unionset + eps)\n    # If both mask and pred are all zero, count as perfect Dice = 1.0\n    zeros = ((target.sum(dim=(2,3))==0) & (pred.sum(dim=(2,3))==0))\n    dice = torch.where(zeros, torch.ones_like(dice), dice)\n    return dice.mean().item()\n\nclass DiceLoss(nn.Module):\n    def __init__(self, eps=1e-7):\n        super().__init__()\n        self.eps = eps\n    def forward(self, logits, targets):\n        inputs = torch.sigmoid(logits)\n        targets = (targets > 0.5).float()\n        intersection = (inputs * targets).sum(dim=(2,3))\n        unionset = inputs.sum(dim=(2,3)) + targets.sum(dim=(2,3))\n        dice = (2 * intersection + self.eps) / (unionset + self.eps)\n        loss = 1 - dice\n        return loss.mean()\n\n# ------- Train and Evaluate --------\ndef train_model(\n    model,\n    dataloader_dict,\n    device,\n    n_epochs=10,\n    lr=1e-3,\n    patience=2,\n):\n    optimizer = torch.optim.Adam(model.parameters(), lr=lr)\n    bce_loss = nn.BCEWithLogitsLoss()\n    dice_loss = DiceLoss()\n    best_state = copy.deepcopy(model.state_dict())\n    best_val_dice = -np.inf\n    epochs_no_improve = 0\n    for ep in range(n_epochs):\n        model.train()\n        train_loss = []\n        train_dice = []\n        for x, y in dataloader_dict['train']:\n            x = x.to(device)\n            y = y.to(device)\n            optimizer.zero_grad()\n            pred = model(x)\n            loss = 0.5*bce_loss(pred, y) + 0.5*dice_loss(pred, y)\n            loss.backward()\n            optimizer.step()\n            train_loss.append(loss.item())\n            train_dice.append(dice_coefficient(pred, y))\n        # Validation\n        model.eval()\n        val_loss = []\n        val_dice = []\n        with torch.no_grad():\n            for x, y in dataloader_dict['val']:\n                x = x.to(device)\n                y = y.to(device)\n                pred = model(x)\n                loss = 0.5*bce_loss(pred, y) + 0.5*dice_loss(pred, y)\n                val_loss.append(loss.item())\n                val_dice.append(dice_coefficient(pred, y))\n        avg_val_dice = np.mean(val_dice)\n        # Early stopping\n        if avg_val_dice > best_val_dice + 1e-4:\n            best_val_dice = avg_val_dice\n            best_state = copy.deepcopy(model.state_dict())\n            epochs_no_improve = 0\n        else:\n            epochs_no_improve += 1\n        if epochs_no_improve >= patience:\n            break\n    model.load_state_dict(best_state)\n    return model\n\ndef evaluate_model(model, dataloader, device):\n    \"\"\"\n    Return average Dice score on dataloader set.\n    \"\"\"\n    model.eval()\n    dices = []\n    with torch.no_grad():\n        for x, y in dataloader:\n            x = x.to(device)\n            y = y.to(device)\n            pred = model(x)\n            dice = dice_coefficient(pred, y)\n            dices.append(dice)\n    mean_dice = float(np.mean(dices)) if len(dices) > 0 else 0.0\n    return mean_dice\n\n# ------- Visualization ---------\ndef plot_test_predictions(model, dataloader, device, n_samples=4):\n    \"\"\"\n    Show input/test image, ground truth, and model prediction side by side.\n    \"\"\"\n    model.eval()\n    shown = 0\n    with torch.no_grad():\n        for x, y in dataloader:\n            x = x.to(device)\n            y = y.to(device)\n            pred = model(x)\n            pred_probs = torch.sigmoid(pred)\n            pred_mask = (pred_probs > 0.5).float()\n            bs = x.shape[0]\n            for i in range(bs):\n                if shown >= n_samples:\n                    return\n                img_np = x[i].cpu().numpy()\n                img_np = img_np - img_np.min()\n                img_np = img_np / (img_np.max() + 1e-8)\n                img_np = np.transpose(img_np, (1,2,0))  # HWC\n                gt_mask = y[i,0].cpu().numpy()\n                pr_mask = pred_mask[i,0].cpu().numpy()\n                # Plot\n                fig, axs = plt.subplots(1,3, figsize=(12,4))\n                axs[0].imshow(img_np, cmap='gray')\n                axs[0].set_title('Input Image')\n                axs[0].axis('off')\n                axs[1].imshow(gt_mask, cmap='Reds')\n                axs[1].set_title('Ground truth')\n                axs[1].axis('off')\n                axs[2].imshow(img_np, cmap='gray')\n                axs[2].imshow(pr_mask, cmap='Blues', alpha=0.5)\n                axs[2].set_title('Prediction Overlay')\n                axs[2].axis('off')\n                plt.tight_layout()\n                plt.show()\n                shown += 1\n\n# ------------- MAIN PIPELINE ---------------\ndef main():\n    \"\"\"\n    Loads data, trains segmentation model, returns model and average Dice on test set.\n    \"\"\"\n    # ---- Settings (tuned for quick/robust test) ----\n    DATA_PATH = r\"E:\\python_project_new\\brain_case_study\\lgg-mri-segmentation\\case_study\"\n    IMG_SIZE = 128        # Small input size for speed\n    BATCH_SIZE = 4\n    N_EPOCHS = 10\n    LR = 1e-3\n    PATIENCE = 2\n    MAX_TRAIN = 100      # Dataset size limits for speed\n    MAX_VAL = 20\n    MAX_TEST = 20\n    NUM_WORKERS = 0      # for compatibility\n    # ---- Device ----\n    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')\n    # ---- Data load ----\n    dataset_dict, dataloader_dict = load_datasets(\n        DATA_PATH,\n        image_size=IMG_SIZE,\n        batch_size=BATCH_SIZE,\n        num_workers=NUM_WORKERS,\n        max_train=MAX_TRAIN,\n        max_val=MAX_VAL,\n        max_test=MAX_TEST\n    )\n    # ---- Model ----\n    model = UNetLite(in_ch=3, out_ch=1).to(device)\n    # ---- Train ----\n    model = train_model(\n        model,\n        dataloader_dict,\n        device,\n        n_epochs=N_EPOCHS,\n        lr=LR,\n        patience=PATIENCE\n    )\n    # ---- Evaluate test set ----\n    test_dice = evaluate_model(model, dataloader_dict['test'], device)\n    return model, test_dice\n\n# --------- Separate function for plotting ---------------\ndef plot_test_results(model, dataloader_dict, device, n_samples=4):\n    \"\"\"\n    Plots segmentation results for a few test samples.\n    \"\"\"\n    plot_test_predictions(model, dataloader_dict['test'], device, n_samples=n_samples)",
                "plan": "1. **Data Loading and Preprocessing:**\n   - Collects matching pairs of image and mask files for train/val/test splits. \n   - Each sample is loaded, normalized (per-slice z-score), and resized to a small square (128x128) for quick training and evaluation.\n   - For training mode, random augmentations (flips, rotations) are applied synchronously to both image and mask.\n   - Dataset loading is capped to a manageable number of samples per split to ensure rapid execution and avoid timeouts.\n\n2. **Dataloader Preparation:**\n   - Each dataset is wrapped in a PyTorch DataLoader for fast and batched access.\n\n3. **Model Definition:**\n   - Implements a lightweight U-Net with fewer channels per layer.\n   - Fewer model parameters speed up both forward and backward passes, reducing runtime and memory footprint.\n\n4. **Loss and Metric:**\n   - Standard BCEWithLogitsLoss is combined with a soft Dice loss to enhance segmentation overlap (accuracy).\n   - Dice coefficient (main metric) is calculated per-image and averaged.\n\n5. **Training Loop:**\n   - Early stopping is used with reduced patience and epoch count for efficient testing and fast convergence.\n   - Each epoch tracks loss and Dice metric.\n   - Best model (by validation Dice) is restored after training.\n\n6. **Testing/Evaluation:**\n   - Computes mean Dice coefficient on limited test set.\n\n7. **Output:**\n   - Returns trained model and test Dice score.\n\n8. **Visualization:**\n   - The plot_test_results function shows a few test samples: input, ground truth, and predicted mask overlays for qualitative assessment.",
                "main_function_name": "main",
                "score": 0.8277716091499688,
                "pass_rate": 1.0,
                "pass_rate_score": 1.0,
                "prediction_score": 0.0,
                "pylint_score": 0.826,
                "radon_score": 0.4517160914996891,
                "test_case_results": {
                    "runnability_check": {
                        "success": true,
                        "reason": null,
                        "message": "code is runnable"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.00109239872553482
                }
            }
        }
    },
    {
        "0": {
            "code_0": {
                "code": "import os\nimport random\nimport numpy as np\nfrom PIL import Image\nimport torch\nimport torch.nn as nn\nimport torch.nn.functional as F\nfrom torch.utils.data import Dataset, DataLoader\nfrom torchvision import transforms\nimport matplotlib.pyplot as plt\n\n# -------------------------- Component: set_random_seed --------------------------\ndef set_random_seed(seed):\n    \"\"\"\n    Set random seed for reproducibility across random, numpy, and torch.\n\n    Args:\n        seed (int): seed value.\n    \"\"\"\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    torch.backends.cudnn.deterministic = True\n    torch.backends.cudnn.benchmark = False\n    if torch.cuda.is_available():\n        torch.cuda.manual_seed_all(seed)\n\n# -------------------------- Component: get_image_mask_pairs --------------------------\ndef get_image_mask_pairs(images_dir, masks_dir):\n    \"\"\"\n    Pairs image paths and their corresponding mask paths by filename convention.\n\n    Args:\n        images_dir (str): Path to images directory.\n        masks_dir (str): Path to masks directory.\n\n    Returns:\n        image_paths (list): List of matched image paths.\n        mask_paths (list): List of matched mask paths.\n    \"\"\"\n    images = sorted([f for f in os.listdir(images_dir) if f.lower().endswith('.tif')])\n    image_paths = []\n    mask_paths = []\n    for image_fname in images:\n        # construct corresponding mask filename\n        base = image_fname[:-4]  # Removes .tif\n        mask_fname = f\"{base}_mask.tif\"\n        mask_full = os.path.join(masks_dir, mask_fname)\n        image_full = os.path.join(images_dir, image_fname)\n        if os.path.exists(mask_full):\n            image_paths.append(image_full)\n            mask_paths.append(mask_full)\n    return image_paths, mask_paths\n\n# -------------------------- Component: MRI2DDataset --------------------------\nclass MRI2DDataset(Dataset):\n    \"\"\"\n    Dataset for paired brain MRI slices and FLAIR abnormality masks.\n    \"\"\"\n    def __init__(self, image_paths, mask_paths, target_size=(256,256), augmentation=False):\n        \"\"\"\n        Args:\n            image_paths (list): List of image file paths.\n            mask_paths (list): List of mask file paths.\n            target_size (tuple): Output size (H, W).\n            augmentation (bool): Whether to apply random augmentation.\n        \"\"\"\n        self.image_paths = image_paths\n        self.mask_paths = mask_paths\n        self.target_size = target_size\n        self.augmentation = augmentation\n\n        # Define basic transform (resize only)\n        self.basic_transform = transforms.Compose([\n            transforms.Resize(self.target_size, interpolation=Image.BILINEAR),\n            transforms.ToTensor(),  # scales [0,255] to [0,1]\n        ])\n        self.mask_transform = transforms.Compose([\n            transforms.Resize(self.target_size, interpolation=Image.NEAREST),\n            transforms.ToTensor(),  # keeps binary\n        ])\n\n    def __len__(self):\n        return len(self.image_paths)\n\n    def __getitem__(self, idx):\n        # Load image (3 channels) and mask (1 channel)\n        img = Image.open(self.image_paths[idx]).convert('RGB')\n        mask = Image.open(self.mask_paths[idx]).convert('L')\n\n        # Resize + to Tensor\n        img_tensor = self.basic_transform(img)  # shape: [3,H,W], float32, [0,1]\n        mask_tensor = self.mask_transform(mask)  # shape: [1,H,W], float32, [0,1]\n\n        # Normalize: zero mean, unit var per-channel\n        img_tensor = (img_tensor - img_tensor.mean(dim=(1,2), keepdim=True)) / (img_tensor.std(dim=(1,2), keepdim=True)+1e-7)\n\n        # Data augmentation (same for image and mask)\n        if self.augmentation:\n            # Random horizontal flip\n            if random.random() > 0.5:\n                img_tensor = torch.flip(img_tensor, dims=[2])\n                mask_tensor = torch.flip(mask_tensor, dims=[2])\n            # Random vertical flip\n            if random.random() > 0.5:\n                img_tensor = torch.flip(img_tensor, dims=[1])\n                mask_tensor = torch.flip(mask_tensor, dims=[1])\n            # Random rotation (0,90,180,270)\n            k = random.randint(0,3)\n            if k > 0:\n                img_tensor = torch.rot90(img_tensor, k=k, dims=[1,2])\n                mask_tensor = torch.rot90(mask_tensor, k=k, dims=[1,2])\n            # Random intensity scaling\n            scale = 0.9 + 0.2 * random.random()\n            img_tensor = img_tensor * scale\n            # Add random brightness\n            img_tensor = img_tensor + (random.uniform(-0.1, 0.1))\n            # Clamp to avoid extreme values after normalization\n            img_tensor = torch.clamp(img_tensor, -3, 3)\n\n        mask_tensor = (mask_tensor > 0.5).float()  # ensure binary\n        return img_tensor, mask_tensor\n\n# -------------------------- Component: get_data_loaders --------------------------\ndef get_data_loaders(base_path, target_size=(256,256), batch_size=6, num_workers=2):\n    \"\"\"\n    Prepare DataLoaders for train/val/test splits.\n\n    Args:\n        base_path (str): Root dataset path.\n        target_size (tuple): Resize/hw.\n        batch_size (int): batch size.\n        num_workers (int): DataLoader parallel workers.\n\n    Returns:\n        dict: {'train', 'val', 'test'} keys each mapping to a DataLoader.\n    \"\"\"\n    splits = ['train', 'val', 'test']\n    data_loaders = {}\n    for split in splits:\n        images_dir = os.path.join(base_path, split, 'images')\n        masks_dir = os.path.join(base_path, split, 'masks')\n        image_paths, mask_paths = get_image_mask_pairs(images_dir, masks_dir)\n        # Augment only training data\n        is_train = split == 'train'\n        dataset = MRI2DDataset(image_paths, mask_paths, target_size=target_size, augmentation=is_train)\n        loader = DataLoader(dataset, batch_size=batch_size, shuffle=is_train, num_workers=num_workers, pin_memory=torch.cuda.is_available())\n        data_loaders[split] = loader\n    return data_loaders\n\n# -------------------------- Component: UNet --------------------------\nclass DoubleConv(nn.Module):\n    def __init__(self, in_ch, out_ch):\n        super().__init__()\n        self.double_conv = nn.Sequential(\n            nn.Conv2d(in_ch, out_ch, kernel_size=3, padding=1),\n            nn.ReLU(inplace=True),\n            nn.Conv2d(out_ch, out_ch, kernel_size=3, padding=1),\n            nn.ReLU(inplace=True),\n        )\n    def forward(self, x):\n        return self.double_conv(x)\n\nclass UNet(nn.Module):\n    \"\"\"\n    U-Net implementation suitable for medical image segmentation.\n    \"\"\"\n    def __init__(self, n_channels=3, n_classes=1):\n        super().__init__()\n        self.in_conv    = DoubleConv(n_channels, 16)\n        self.down1      = nn.Sequential(nn.MaxPool2d(2), DoubleConv(16, 32))\n        self.down2      = nn.Sequential(nn.MaxPool2d(2), DoubleConv(32, 64))\n        self.down3      = nn.Sequential(nn.MaxPool2d(2), DoubleConv(64, 128))\n        self.down4      = nn.Sequential(nn.MaxPool2d(2), DoubleConv(128, 256))\n        # Decoder\n        self.up1        = nn.ConvTranspose2d(256, 128, kernel_size=2, stride=2)\n        self.dec1       = DoubleConv(256, 128)\n        self.up2        = nn.ConvTranspose2d(128, 64, kernel_size=2, stride=2)\n        self.dec2       = DoubleConv(128, 64)\n        self.up3        = nn.ConvTranspose2d(64, 32, kernel_size=2, stride=2)\n        self.dec3       = DoubleConv(64, 32)\n        self.up4        = nn.ConvTranspose2d(32, 16, kernel_size=2, stride=2)\n        self.dec4       = DoubleConv(32, 16)\n        self.out_conv   = nn.Conv2d(16, n_classes, kernel_size=1)\n\n    def forward(self, x):\n        # Encode\n        x1 = self.in_conv(x)   # [B,16,H,W]\n        x2 = self.down1(x1)    # [B,32,H/2,W/2]\n        x3 = self.down2(x2)    # [B,64,H/4,W/4]\n        x4 = self.down3(x3)    # [B,128,H/8,W/8]\n        x5 = self.down4(x4)    # [B,256,H/16,W/16]\n        # Decode\n        u1 = self.up1(x5)\n        u1 = torch.cat([crop_like(x4, u1), u1], dim=1)\n        d1 = self.dec1(u1)\n        u2 = self.up2(d1)\n        u2 = torch.cat([crop_like(x3, u2), u2], dim=1)\n        d2 = self.dec2(u2)\n        u3 = self.up3(d2)\n        u3 = torch.cat([crop_like(x2, u3), u3], dim=1)\n        d3 = self.dec3(u3)\n        u4 = self.up4(d3)\n        u4 = torch.cat([crop_like(x1, u4), u4], dim=1)\n        d4 = self.dec4(u4)\n        out = self.out_conv(d4)\n        return out\n\n# Helper for cropping encoder feature map to match decoder upsampled size\ndef crop_like(feat, target):\n    \"\"\"\n    Center crop feat to match spatial size of target.\n    \"\"\"\n    if feat.shape[2:] == target.shape[2:]:\n        return feat\n    diff_y = feat.shape[2] - target.shape[2]\n    diff_x = feat.shape[3] - target.shape[3]\n    return feat[:,:, diff_y//2:feat.shape[2]-(diff_y - diff_y//2), diff_x//2:feat.shape[3]-(diff_x-diff_x//2)]\n\n# -------------------------- Component: dice_coefficient --------------------------\ndef dice_coefficient(pred_mask, true_mask, epsilon=1e-7):\n    \"\"\"\n    Computes Dice coefficient for batched binary masks.\n\n    Args:\n        pred_mask (torch.Tensor): [B,1,H,W], values [0,1] (after sigmoid).\n        true_mask (torch.Tensor): [B,1,H,W], binary {0,1}.\n        epsilon (float): Smoothing term.\n\n    Returns:\n        float: Average Dice over batch.\n    \"\"\"\n    with torch.no_grad():\n        pred_bin = (pred_mask > 0.5).float()\n        true_bin = (true_mask > 0.5).float()\n        # Flatten\n        pred_flat = pred_bin.view(pred_bin.size(0), -1)\n        true_flat = true_bin.view(true_bin.size(0), -1)\n        intersection = (pred_flat * true_flat).sum(dim=1)\n        dice = (2. * intersection + epsilon) / (pred_flat.sum(dim=1) + true_flat.sum(dim=1) + epsilon)\n        return dice.mean().item()\n\n# -------------------------- Component: train_unet --------------------------\ndef train_unet(model, train_loader, val_loader, num_epochs, learning_rate, device):\n    \"\"\"\n    Trains U-Net on train_loader, validates on val_loader.\n\n    Args:\n        model (UNet): segmentation model.\n        train_loader (DataLoader): train data.\n        val_loader (DataLoader): validation data.\n        num_epochs (int): training epochs.\n        learning_rate (float): optimizer lr.\n        device (torch.device): cuda/cpu.\n\n    Returns:\n        UNet: trained model (best val dice).\n        float: best validation dice.\n    \"\"\"\n    model = model.to(device)\n    optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate)\n    criterion = nn.BCEWithLogitsLoss()\n    best_dice = 0.0\n    best_weights = None\n    for epoch in range(num_epochs):\n        model.train()\n        running_loss = 0.0\n        for images, masks in train_loader:\n            images = images.to(device, dtype=torch.float32)\n            masks  = masks.to(device, dtype=torch.float32)\n            optimizer.zero_grad()\n            logits = model(images)\n            # [B,1,H,W] after sigmoid\n            loss = criterion(logits, masks)\n            loss.backward()\n            optimizer.step()\n            running_loss += loss.item() * images.size(0)\n        train_loss = running_loss / len(train_loader.dataset)\n        # Validation\n        model.eval()\n        dices = []\n        with torch.no_grad():\n            for images, masks in val_loader:\n                images = images.to(device, dtype=torch.float32)\n                masks  = masks.to(device, dtype=torch.float32)\n                logits = model(images)\n                probs = torch.sigmoid(logits)\n                dice = dice_coefficient(probs, masks)\n                dices.append(dice)\n        mean_dice = np.mean(dices)\n        if mean_dice > best_dice:\n            best_dice = mean_dice\n            best_weights = model.state_dict()\n        # Optionally, print epoch status\n        # print(f\"[{epoch+1}/{num_epochs}] Train loss: {train_loss:.3f}  | Val Dice: {mean_dice:.4f}\")\n    # Load best weights\n    if best_weights is not None:\n        model.load_state_dict(best_weights)\n    return model, best_dice\n\n# -------------------------- Component: evaluate_model --------------------------\ndef evaluate_model(model, data_loader, device):\n    \"\"\"\n    Evaluate model on a dataloader and returns mean Dice + sample predictions.\n\n    Args:\n        model (UNet): trained model\n        data_loader (DataLoader): test loader\n        device (torch.device): cpu/gpu\n\n    Returns:\n        mean_dice (float): average Dice over set\n        example_images (list): up to 8 image tensors [3,H,W]\n        example_gt_masks (list): up to 8 GT mask tensors [1,H,W]\n        example_pred_masks (list): up to 8 predicted mask tensors [1,H,W]\n    \"\"\"\n    model.eval()\n    model = model.to(device)\n    dices = []\n    max_examples = 8\n    example_images = []\n    example_gt_masks = []\n    example_pred_masks = []\n    with torch.no_grad():\n        for images, masks in data_loader:\n            images = images.to(device, dtype=torch.float32)\n            masks  = masks.to(device, dtype=torch.float32)\n            logits = model(images)\n            probs = torch.sigmoid(logits)\n            preds = (probs > 0.5).float()\n            # Dice over batch\n            dice = dice_coefficient(probs, masks)\n            dices.append(dice)\n            # Collect up to max_examples for visualization\n            if len(example_images) < max_examples:\n                needed = max_examples - len(example_images)\n                for i in range(min(images.size(0), needed)):\n                    # Detach; take CPU for visualization\n                    example_images.append(images[i].cpu())\n                    example_gt_masks.append(masks[i].cpu())\n                    example_pred_masks.append(preds[i].cpu())\n    mean_dice = np.mean(dices) if dices else 0.0\n    return mean_dice, example_images, example_gt_masks, example_pred_masks\n\n# -------------------------- Component: plot_predictions --------------------------\ndef plot_predictions(example_images, example_gt_masks, example_pred_masks, N=6):\n    \"\"\"\n    Plots predicted and ground-truth segmentation masks overlaid on MRI images.\n\n    Args:\n        example_images (list): [N, 3,H,W] tensors (in normalized space).\n        example_gt_masks (list): [N,1,H,W] tensors.\n        example_pred_masks (list): [N,1,H,W] tensors.\n        N (int): number of examples to plot.\n    \"\"\"\n    n = min(N, len(example_images))\n    plt.figure(figsize=(n * 4.5, 12))\n    for i in range(n):\n        img = example_images[i].clone()\n        # Undo normalization for display: rescale channels\n        img_disp = img.numpy()\n        img_disp = img_disp - img_disp.min()\n        img_disp = img_disp / (img_disp.max() + 1e-10)\n        img_disp = np.transpose(img_disp, (1,2,0))  # [H,W,3]\n\n        gt_mask = example_gt_masks[i].squeeze().numpy()  # [H,W]\n        pred_mask = example_pred_masks[i].squeeze().numpy()  # [H,W]\n\n        # --- subplot 1: input image ---\n        plt.subplot(3, n, i+1)\n        plt.imshow(img_disp)\n        plt.axis('off')\n        plt.title('MRI Slice')\n\n        # --- subplot 2: gt overlay ---\n        plt.subplot(3, n, n + i+1)\n        plt.imshow(img_disp, alpha=1)\n        plt.imshow(gt_mask, cmap='jet', alpha=0.5)\n        plt.axis('off')\n        plt.title('Ground Truth Mask')\n\n        # --- subplot 3: pred overlay ---\n        plt.subplot(3, n, 2*n + i+1)\n        plt.imshow(img_disp, alpha=1)\n        plt.imshow(pred_mask, cmap='spring', alpha=0.5)\n        plt.axis('off')\n        plt.title('Predicted Mask')\n    plt.tight_layout()\n    plt.show()\n\n# -------------------------- Component: main (Full Pipeline) --------------------------\ndef main():\n    \"\"\"\n    Full pipeline for MRI FLAIR abnormality segmentation.\n    Returns:\n        model (UNet): trained model\n        test_dice (float): average Dice on test set\n        example_images (list[Tensor])\n        example_gt_masks (list[Tensor])\n        example_pred_masks (list[Tensor])\n    \"\"\"\n    # --- Step 1: Set random seed for reproducibility ---\n    set_random_seed(42)\n\n    # --- Step 2: Prepare DataLoaders ---\n    base_path = r\"E:\\python_project_new\brain_case_study\\lgg-mri-segmentation\\case_study\"\n    target_size = (256, 256)\n    batch_size = 6\n    num_workers = 2 if torch.cuda.is_available() else 0\n    loaders = get_data_loaders(base_path, target_size=target_size, batch_size=batch_size, num_workers=num_workers)\n    train_loader = loaders['train']\n    val_loader = loaders['val']\n    test_loader = loaders['test']\n\n    # --- Step 3: Initialize model ---\n    model = UNet(n_channels=3, n_classes=1)\n\n    # --- Step 4: Train model ---\n    n_epochs = 18\n    lr = 1e-3\n    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')\n    model, best_val_dice = train_unet(model, train_loader, val_loader, n_epochs, lr, device)\n\n    # --- Step 5: Evaluate on test set ---\n    test_dice, example_images, example_gt_masks, example_pred_masks = evaluate_model(model, test_loader, device)\n\n    # --- Step 6: Return model, test dice, and examples for plotting ---\n    return model, test_dice, example_images, example_gt_masks, example_pred_masks\n\n# -- end all components --",
                "plan": "Step-by-step workflow of the complete code:\n\n1. **Reproducibility**: The `set_random_seed` function ensures consistent, repeatable results each run by setting seeds for python, numpy, torch and torch.cuda across training and evaluation.\n\n2. **Data Pairing**: `get_image_mask_pairs` reads all MRI slice image filenames in a given images/ directory, creates mask filenames using the \"_mask.tif\" naming rule, verifies mask existence, and returns ordered, matched lists of absolute image and mask file paths.\n\n3. **Dataset Preparation**: `MRI2DDataset` is a PyTorch `Dataset` that:\n    - Loads MRI images as 3-channel RGB and corresponding masks as grayscale (L mode).\n    - Resizes both images and masks (using bilinear and nearest-neighbor interpolation, respectively) to a common shape.\n    - Converts images to tensor, normalizes them (zero mean, unit variance per-slice), and ensures masks are always binary {0,1}.\n    - If augmentation is enabled (train set), applies the same random flips, rotations, and intensity adjustments to both image and mask, ensuring spatial correspondence.\n\n4. **DataLoader Construction**: `get_data_loaders` automates train/val/test DataLoader creation, utilizing the paired lists and MRI2DDataset, toggling augmentation for training, and providing correct shuffling and batching.\n\n5. **Model Definition**: A UNet implementation that:\n    - Accepts 3-channel input and outputs a single-channel segmentation map.\n    - Stacks double conv blocks, max-pooling for downsampling, transposed convolutions for upsampling, and skip connections between mirroring encoder/decoder blocks.\n    - Ensures feature map alignment via a `crop_like` helper.\n\n6. **Metric**: `dice_coefficient` applies a threshold to outputs, flattens masks, and computes the Dice coefficient per-image, returning their mean.\n\n7. **Training**: `train_unet` iterates over epochs:\n    - Standard training on train_loader with BCEWithLogits loss.\n    - At epoch end, switches to evaluation mode, computes validation Dice coefficient.\n    - Tracks the best-validation Dice and reloads the corresponding model weights at the end.\n\n8. **Evaluation**: `evaluate_model` performs full-test inference:\n    - Collects per-batch dice scores.\n    - Collects up to 8 sample (image, gt mask, pred mask) sets for plotting.\n\n9. **Visualization**: `plot_predictions` takes a few test examples and, for each:\n    - Displays the input MRI slice.\n    - Overlays ground-truth and predicted binary masks (with transparency/heatmap coloring) for visual assessment.\n\n10. **Main Orchestration**: `main()` executes all steps in order:\n    - Sets seed, prepares data, builds the model, trains and validates, loads the best weights, evaluates on test, and collects predictions.\n    - Exposes for outside use: the trained model, test Dice metric, and a set of test images and their corresponding predictions.",
                "main_function_name": "main",
                "score": 0.13435519583857286,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.828,
                "radon_score": 0.5155519583857288,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 410, in main\n  File \"<string>\", line 143, in get_data_loaders\n  File \"<string>\", line 41, in get_image_mask_pairs\nOSError: [WinError 123] 文件名、目录名或卷标语法不正确。: 'E:\\\\python_project_new\\x08rain_case_study\\\\lgg-mri-segmentation\\\\case_study\\\\train\\\\images'\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.007100591715976331
                }
            }
        },
        "1": {
            "code_0": {
                "code": "base_path = r\"E:\\python_project_new\brain_case_study\\lgg-mri-segmentation\\case_study\"",
                "plan": "**Step-by-step workflow:**\n1. **Reproducibility**: `set_random_seed` ensures all randomness (Python, Numpy, Torch) is controlled.\n2. **Data Loading**:\n   - File pairing uses `get_image_mask_pairs`, carefully joining images and masks by filename convention.\n   - DataLoader setup in `get_data_loaders` for train/val/test splits, applying augmentation only to train.\n3. **Dataset Preprocessing**:\n   - Each image is zero-mean/unit-variance normalized per channel.\n   - Images and masks resized to `target_size`.\n   - Augmentation (random flip, rotate, brightness/contrast) applied in training.\n4. **Model Definition**:\n   - U-Net with batch normalization and skip connections.\n   - `crop_like` for correct spatial alignment of encoder and decoder feature maps.\n5. **Training Function**:\n   - Trains for `n_epochs` with binary cross-entropy loss (including logits).\n   - Keeps best validation Dice weights.\n6. **Evaluation**:\n   - Runs on test loader.\n   - Collects mean Dice and up to 8 sample images/masks/predictions for qualitative review.\n7. **Plotting**:\n   - Function to visualize overlayed images, ground truth and predictions for qualitative assessment.\n   - Separate `plot_test_examples_on_testset` for plotting after model training.\n8. **Integration in Main**:\n   - The `main` function sets up everything: seed, dataloaders, U-Net, training, testing, and returns trained model, Dice, and representative predictions for inspection.\n9. **I/O Contract**:\n   - `main()` accepts no arguments, returns (model, test_dice, example_images, example_gt_masks, example_pred_masks)\n   - Visualization is handled via an auxiliary plotting function.",
                "main_function_name": "main",
                "score": 0.1,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.0,
                "radon_score": 1.0,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "main_func_compile_error",
                        "message": "Main function 'main' not found or not callable"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        },
        "2": {
            "code_0": {
                "code": "import os\nimport random\nimport numpy as np\nfrom glob import glob\n\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nimport torch.nn.functional as F\nfrom torchvision import transforms\nfrom PIL import Image\nimport matplotlib.pyplot as plt\n\n# ======================\n# 1. Reproducibility Seed\n# ======================\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    torch.cuda.manual_seed_all(seed)\n\n# ======================\n# 2. Dataset Class\n# ======================\nclass MRISegmentationDataset(Dataset):\n    def __init__(self, images_dir, masks_dir, augment=False, image_size=(256, 256)):\n        self.image_paths = sorted(glob(os.path.join(images_dir, \"*.tif\")))\n        self.mask_paths = [\n            os.path.join(masks_dir, os.path.basename(f).replace('.tif', '_mask.tif')) \n            for f in self.image_paths\n        ]\n        self.augment = augment\n        self.image_size = image_size\n\n    def __len__(self):\n        return len(self.image_paths)\n\n    def __getitem__(self, idx):\n        # Load image (kept 3-channel as per data format)\n        img = Image.open(self.image_paths[idx]).convert('RGB')\n        mask = Image.open(self.mask_paths[idx]).convert('L')\n        \n        # Resize\n        img = img.resize(self.image_size, resample=Image.BILINEAR)\n        mask = mask.resize(self.image_size, resample=Image.NEAREST)\n        \n        # Convert to array\n        img = np.array(img).astype(np.float32) # (H,W,3)\n        mask = np.array(mask).astype(np.float32) # (H,W)\n        mask = mask / 255.0  # ensure mask is in [0,1]\n\n        # Slice-wise normalization to [0,1]\n        img = (img - img.min()) / (img.max() - img.min() + 1e-8)\n\n        # Augmentation\n        if self.augment:\n            if random.random() > 0.5:\n                img = np.fliplr(img)\n                mask = np.fliplr(mask)\n            if random.random() > 0.5:\n                img = np.flipud(img)\n                mask = np.flipud(mask)\n            if random.random() > 0.5:\n                angle = random.choice([90, 180, 270])\n                img = np.rot90(img, k=angle//90)\n                mask = np.rot90(mask, k=angle//90)\n            if random.random() > 0.5:\n                # Random brightness\n                factor = 0.9 + 0.2 * random.random()\n                img = img * factor\n                img = np.clip(img, 0, 1)\n\n        # To tensor, shape: (C,H,W)\n        img = torch.from_numpy(img.transpose(2,0,1))  # [3,H,W]\n        mask = torch.from_numpy(mask).unsqueeze(0)    # [1,H,W]\n        mask = (mask > 0.5).float()\n        return img, mask\n\n# ======================\n# 3. U-Net Model\n# ======================\nclass DoubleConv(nn.Module):\n    def __init__(self, in_channels, out_channels):\n        super().__init__()\n        self.seq = nn.Sequential(\n            nn.Conv2d(in_channels, out_channels, 3, padding=1, bias=False),\n            nn.BatchNorm2d(out_channels),\n            nn.ReLU(inplace=True),\n            nn.Conv2d(out_channels, out_channels, 3, padding=1, bias=False),\n            nn.BatchNorm2d(out_channels),\n            nn.ReLU(inplace=True)\n        )\n    def forward(self, x):\n        return self.seq(x)\n\nclass UNet(nn.Module):\n    def __init__(self, in_channels=3, out_channels=1, features=[64, 128, 256, 512]):\n        super().__init__()\n        self.downs = nn.ModuleList()\n        self.ups = nn.ModuleList()\n        # Down part\n        for feature in features:\n            prev = in_channels if len(self.downs)==0 else features[len(self.downs)-1]\n            self.downs.append(DoubleConv(prev, feature))\n        self.pool = nn.MaxPool2d(2,2)\n        # Bottleneck\n        self.bottleneck = DoubleConv(features[-1], features[-1]*2)\n        # Up part\n        for feature in reversed(features):\n            self.ups.append(\n                nn.ConvTranspose2d(feature*2, feature, kernel_size=2, stride=2)\n            )\n            self.ups.append(\n                DoubleConv(feature*2, feature)\n            )\n        self.final_conv = nn.Conv2d(features[0], out_channels, kernel_size=1)\n    def forward(self, x):\n        skips = []\n        for mod in self.downs:\n            x = mod(x)\n            skips.append(x)\n            x = self.pool(x)\n        x = self.bottleneck(x)\n        skips = skips[::-1]\n        for idx in range(0,len(self.ups),2):\n            x = self.ups[idx](x)\n            skip = skips[idx//2]\n            # Sometimes upsampled x and skip may not have equal spatial dims\n            if x.shape[-2:] != skip.shape[-2:]:\n                x = F.interpolate(x, size=skip.shape[-2:], mode=\"bilinear\", align_corners=False)\n            x = torch.cat([skip, x], dim=1)\n            x = self.ups[idx+1](x)\n        return torch.sigmoid(self.final_conv(x))\n\n# ======================\n# 4. Metrics\n# ======================\ndef dice_coefficient(pred, target, threshold=0.5, eps=1e-6):\n    # pred, target in (N,1,H,W)\n    pred = (pred > threshold).float()\n    target = (target > threshold).float()\n    inter = (pred * target).sum(dim=(2,3))\n    union = pred.sum(dim=(2,3)) + target.sum(dim=(2,3))\n    dice = (2*inter + eps)/(union + eps)\n    return dice.mean().item()\n\n# ======================\n# 5. Train, Validate, Test\n# ======================\ndef train_one_epoch(model, dataloader, criterion, optimizer, device):\n    model.train()\n    epoch_loss = 0\n    for images, masks in dataloader:\n        images = images.to(device)\n        masks = masks.to(device)\n        optimizer.zero_grad()\n        outputs = model(images)\n        loss = criterion(outputs, masks)\n        loss.backward()\n        optimizer.step()\n        epoch_loss += loss.item()*images.size(0)\n    return epoch_loss/len(dataloader.dataset)\n\ndef validate(model, dataloader, criterion, device):\n    model.eval()\n    val_loss = 0\n    dices = []\n    with torch.no_grad():\n        for images, masks in dataloader:\n            images = images.to(device)\n            masks = masks.to(device)\n            outputs = model(images)\n            loss = criterion(outputs, masks)\n            val_loss += loss.item()*images.size(0)\n            dices.append(dice_coefficient(outputs.detach().cpu(), masks.cpu()))\n    return val_loss/len(dataloader.dataset), np.mean(dices)\n\ndef test(model, dataloader, device):\n    model.eval()\n    dices = []\n    with torch.no_grad():\n        for images, masks in dataloader:\n            images = images.to(device)\n            masks = masks.to(device)\n            outputs = model(images)\n            dices.append(dice_coefficient(outputs.cpu(), masks.cpu()))\n    return np.mean(dices)\n\n# ======================\n# 6. Main Function\n# ======================\ndef main():\n    set_seed(42)\n    base_path = r\"E:\\python_project_new\brain_case_study\\lgg-mri-segmentation\\case_study\"\n    train_img_dir = os.path.join(base_path, \"train\", \"images\")\n    train_mask_dir = os.path.join(base_path, \"train\", \"masks\")\n    val_img_dir = os.path.join(base_path, \"val\", \"images\")\n    val_mask_dir = os.path.join(base_path, \"val\", \"masks\")\n    test_img_dir = os.path.join(base_path, \"test\", \"images\")\n    test_mask_dir = os.path.join(base_path, \"test\", \"masks\")\n    \n    # Hyper-parameters\n    image_size = (256,256)\n    batch_size = 8\n    lr = 1e-3\n    num_epochs = 25\n    patience = 7\n\n    # CUDA if available\n    device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n\n    # Datasets and loaders\n    train_ds = MRISegmentationDataset(train_img_dir, train_mask_dir, augment=True, image_size=image_size)\n    val_ds = MRISegmentationDataset(val_img_dir, val_mask_dir, augment=False, image_size=image_size)\n    test_ds = MRISegmentationDataset(test_img_dir, test_mask_dir, augment=False, image_size=image_size)\n\n    train_loader = DataLoader(train_ds, batch_size=batch_size, shuffle=True, num_workers=2, pin_memory=True)\n    val_loader = DataLoader(val_ds, batch_size=batch_size, shuffle=False, num_workers=2, pin_memory=True)\n    test_loader = DataLoader(test_ds, batch_size=1, shuffle=False)\n\n    # Model, loss, optimizer\n    model = UNet(in_channels=3, out_channels=1).to(device)\n    criterion = nn.BCELoss()\n    optimizer = torch.optim.Adam(model.parameters(), lr=lr)\n    # Early stopping setup\n    best_val_dice = 0.0\n    best_model_wts = None\n    patience_counter = 0\n\n    for epoch in range(num_epochs):\n        train_loss = train_one_epoch(model, train_loader, criterion, optimizer, device)\n        val_loss, val_dice = validate(model, val_loader, criterion, device)\n        if val_dice > best_val_dice:\n            best_val_dice = val_dice\n            best_model_wts = model.state_dict()\n            patience_counter = 0\n        else:\n            patience_counter += 1\n        # Optionally, print progress (comment out since no print allowed in returned code)\n        # print(f\"Epoch {epoch}: Train Loss {train_loss:.4f} | Val Loss {val_loss:.4f} | Val Dice {val_dice:.4f}\")\n        if patience_counter >= patience:\n            break\n\n    if best_model_wts is not None:\n        model.load_state_dict(best_model_wts)\n    # Evaluate on test set\n    test_dice = test(model, test_loader, device)\n    # Return model instance (with best weights loaded) and best test dice\n    return model, test_dice\n\n# ======================\n# 7. Plot Function\n# ======================\ndef plot_predictions(model, num_samples=4):\n    \"\"\"\n    Plot sample predictions from the test set.\n    :param model: Trained UNet instance\n    :param num_samples: Number of samples to visualize\n    \"\"\"\n    base_path = r\"E:\\python_project_new\brain_case_study\\lgg-mri-segmentation\\case_study\"\n    test_img_dir = os.path.join(base_path, \"test\", \"images\")\n    test_mask_dir = os.path.join(base_path, \"test\", \"masks\")\n    image_size = (256,256)\n    test_ds = MRISegmentationDataset(test_img_dir, test_mask_dir, augment=False, image_size=image_size)\n    model.eval()\n    device = next(model.parameters()).device\n    idxs = np.random.choice(len(test_ds), size=min(num_samples, len(test_ds)), replace=False)\n    fig, axs = plt.subplots(len(idxs), 3, figsize=(12,4*len(idxs)))\n    if len(idxs)==1:\n        axs = [axs]\n    with torch.no_grad():\n        for i, idx in enumerate(idxs):\n            img, msk = test_ds[idx]\n            img_in = img.unsqueeze(0).to(device)\n            pred = model(img_in)\n            pred_mask = (pred[0,0].cpu().numpy() > 0.5).astype(np.uint8)\n            axs[i][0].imshow(img.permute(1,2,0).cpu().numpy(), cmap='gray')\n            axs[i][0].set_title(\"Input image\")\n            axs[i][1].imshow(msk[0].numpy(), cmap='gray')\n            axs[i][1].set_title(\"True mask\")\n            axs[i][2].imshow(img.permute(1,2,0).cpu().numpy(), cmap='gray')\n            axs[i][2].imshow(pred_mask, cmap='Reds', alpha=0.4)\n            axs[i][2].set_title(\"Prediction overlay\")\n            for k in range(3):\n                axs[i][k].axis(\"off\")\n    plt.tight_layout()\n    plt.show()",
                "plan": "1. **Reproducibility**: The script starts by setting global seeds to ensure results are reproducible.\n2. **Custom Dataset**: Defines a PyTorch Dataset class for paired MRI slice images and their binary masks, handling augmentations (flips, rotations, brightness), resizing, and normalization. It ensures each image is correctly paired with its mask by strict filename logic.\n3. **Model Definition (U-Net)**: Implements a classic U-Net architecture with skip connections, using double conv blocks for downsampling and upsampling paths.\n4. **Metrics**: Uses Dice coefficient for evaluation, as is standard for segmentation, with binary masking and handling for averaging.\n5. **Training/Validation/Early Stopping**: Includes separate training and validation loops, and tracks the best validation Dice to implement early stopping. Uses Adam optimizer and BCELoss (since output is after sigmoid).\n6. **Model Output**: The main() function returns the trained PyTorch model instance (with weights) and the average Dice score on the test set (across all test images).\n7. **Visualization**: plot_predictions visualizes test results, showing the input image, ground truth mask, and overlayed predictions, for visual assessment of segmentation quality.\n8. **Separation of Logic**: The script does not execute training or evaluation directly when imported (per requirements) but exposes all necessary functions for external invocation.\n9. **Device Handling**: All tensors and model are moved to GPU if available, for efficiency.\n10. **All parameters and paths are fixed per the task description.**",
                "main_function_name": "main",
                "score": 0.12364583091840309,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.741,
                "radon_score": 0.4954583091840308,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 218, in main\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\utils\\data\\dataloader.py\", line 350, in __init__\n    sampler = RandomSampler(dataset, generator=generator)  # type: ignore[arg-type]\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\utils\\data\\sampler.py\", line 143, in __init__\n    raise ValueError(f\"num_samples should be a positive integer value, but got num_samples={self.num_samples}\")\nValueError: num_samples should be a positive integer value, but got num_samples=0\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        },
        "3": {
            "code_0": {
                "code": "import os\nimport random\nimport numpy as np\nfrom glob import glob\nfrom PIL import Image\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nimport torch.nn.functional as F\nimport matplotlib.pyplot as plt\n\n# For reproducibility, set seeds\ndef set_seed(seed=42):\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    torch.cuda.manual_seed_all(seed)\n\n# Dataset class for reading and pairing images/masks with optional augmentation\nclass MRISegmentationDataset(Dataset):\n    def __init__(self, images_dir, masks_dir, augment=False, image_size=(256,256)):\n        self.images_dir = images_dir\n        self.masks_dir = masks_dir\n        self.image_size = image_size\n        self.augment = augment\n\n        self.image_paths = sorted(glob(os.path.join(images_dir, '*.tif')))\n        self.mask_paths = []\n        # Pair each image with mask, mask filename is <img_base>_mask.tif\n        for img_path in self.image_paths:\n            img_base = os.path.basename(img_path).replace('.tif', '')\n            mask_path = os.path.join(masks_dir, img_base + '_mask.tif')\n            if os.path.exists(mask_path):\n                self.mask_paths.append(mask_path)\n            else:\n                # Data integrity: if mask does not exist, skip this pair\n                self.mask_paths.append(None)\n        # Remove non-existing pairs\n        valid = [(img, mask) for img, mask in zip(self.image_paths, self.mask_paths) if mask is not None]\n        self.image_paths = [v[0] for v in valid]\n        self.mask_paths = [v[1] for v in valid]\n\n    def __len__(self):\n        return len(self.image_paths)\n\n    def __getitem__(self, idx):\n        # Load image (3 channel RGB tif)\n        img = Image.open(self.image_paths[idx]).convert('RGB')\n        mask = Image.open(self.mask_paths[idx]).convert('L')\n\n        # Resize\n        img = img.resize(self.image_size, resample=Image.BILINEAR)\n        mask = mask.resize(self.image_size, resample=Image.NEAREST)\n\n        # Convert to np arrays\n        img = np.array(img).astype(np.float32)           # shape: (H,W,3)\n        mask = np.array(mask).astype(np.float32)         # shape: (H,W)\n        mask = (mask > 127).astype(np.float32)           # binary mask [0,1]\n\n        # Slice-wise normalization [0,1]\n        img = (img - img.min()) / (img.max() - img.min() + 1e-8)\n\n        # Augmentation: must apply same transform to both\n        if self.augment:\n            if random.random() < 0.5:\n                img = np.fliplr(img)\n                mask = np.fliplr(mask)\n            if random.random() < 0.5:\n                img = np.flipud(img)\n                mask = np.flipud(mask)\n            if random.random() < 0.5:\n                angle = random.choice([1,2,3]) # Rot90: 1=90°, 2=180°, 3=270°\n                img = np.rot90(img, k=angle)\n                mask = np.rot90(mask, k=angle)\n            if random.random() < 0.5:\n                factor = 0.85 + random.uniform(0, 0.3)\n                img = img * factor\n                img = np.clip(img, 0, 1)\n\n        # Change to torch Tensor (CHW)\n        img = torch.from_numpy(img.transpose(2,0,1))    # [3,H,W]\n        mask = torch.from_numpy(mask).unsqueeze(0)       # [1,H,W]\n        return img.float(), mask.float()\n\n# U-Net blocks for encoder-decoder\nclass DoubleConv(nn.Module):\n    def __init__(self, in_channels, out_channels):\n        super().__init__()\n        self.net = nn.Sequential(\n            nn.Conv2d(in_channels, out_channels, kernel_size=3, padding=1, bias=False),\n            nn.BatchNorm2d(out_channels),\n            nn.ReLU(inplace=True),\n            nn.Conv2d(out_channels, out_channels, kernel_size=3, padding=1, bias=False),\n            nn.BatchNorm2d(out_channels),\n            nn.ReLU(inplace=True)\n        )\n    def forward(self, x):\n        return self.net(x)\n\nclass UNet(nn.Module):\n    def __init__(self, in_channels=3, out_channels=1, features=[64,128,256,512]):\n        super().__init__()\n        self.downs = nn.ModuleList()\n        self.ups = nn.ModuleList()\n        # Downsampling path\n        ch_in = in_channels\n        for feat in features:\n            self.downs.append(DoubleConv(ch_in, feat))\n            ch_in = feat\n        self.pool = nn.MaxPool2d(kernel_size=2, stride=2)\n        # Bottleneck\n        self.bottleneck = DoubleConv(features[-1], features[-1]*2)\n        # Upsampling path\n        rev_feats = list(reversed(features))\n        ch_in = features[-1]*2\n        for feat in rev_feats:\n            self.ups.append(\n                nn.ConvTranspose2d(ch_in, feat, kernel_size=2, stride=2)\n            )\n            self.ups.append(DoubleConv(feat*2, feat))\n            ch_in = feat\n        self.final_conv = nn.Conv2d(features[0], out_channels, kernel_size=1)\n    def forward(self, x):\n        skip_connections = []\n        for down_module in self.downs:\n            x = down_module(x)\n            skip_connections.append(x)\n            x = self.pool(x)\n        x = self.bottleneck(x)\n        skip_connections = skip_connections[::-1]\n        for idx in range(0, len(self.ups), 2):\n            x = self.ups[idx](x)\n            skip = skip_connections[idx//2]\n            if x.shape[-2:] != skip.shape[-2:]:\n                x = F.interpolate(x, size=skip.shape[-2:], mode='bilinear', align_corners=False)\n            x = torch.cat([skip, x], dim=1)\n            x = self.ups[idx+1](x)\n        out = self.final_conv(x)\n        return torch.sigmoid(out)\n\n# Dice coefficient calculation utility (batchwise)\ndef dice_coefficient(pred, target, threshold=0.5, eps=1e-6):\n    # pred,target: (N,1,H,W)\n    pred = (pred > threshold).float()\n    target = (target > threshold).float()\n    intersection = (pred * target).sum(dim=(2,3))\n    total = pred.sum(dim=(2,3)) + target.sum(dim=(2,3))\n    dice = (2 * intersection + eps) / (total + eps)\n    return dice.mean().item()\n\n# Training loop (one epoch)\ndef train_one_epoch(model, loader, criterion, optimizer, device):\n    model.train()\n    loss_accum = 0.0\n    for imgs, masks in loader:\n        imgs = imgs.to(device)\n        masks = masks.to(device)\n        optimizer.zero_grad()\n        outputs = model(imgs)\n        loss = criterion(outputs, masks)\n        loss.backward()\n        optimizer.step()\n        loss_accum += loss.item() * imgs.size(0)\n    avg_loss = loss_accum / len(loader.dataset)\n    return avg_loss\n\n# Validation/eval (over val set)\ndef eval_epoch(model, loader, criterion, device):\n    model.eval()\n    loss_accum = 0.0\n    dices = []\n    with torch.no_grad():\n        for imgs, masks in loader:\n            imgs = imgs.to(device)\n            masks = masks.to(device)\n            outputs = model(imgs)\n            loss = criterion(outputs, masks)\n            loss_accum += loss.item() * imgs.size(0)\n            dices.append(dice_coefficient(outputs.cpu(), masks.cpu()))\n    avg_loss = loss_accum / len(loader.dataset)\n    dice_score = np.mean(dices) if dices else 0.0\n    return avg_loss, dice_score\n\n# Test eval (just dice)\ndef test_eval(model, loader, device):\n    model.eval()\n    dices = []\n    with torch.no_grad():\n        for imgs, masks in loader:\n            imgs = imgs.to(device)\n            masks = masks.to(device)\n            outputs = model(imgs)\n            dices.append(dice_coefficient(outputs.cpu(), masks.cpu()))\n    avg_dice = np.mean(dices) if dices else 0.0\n    return avg_dice\n\ndef main():\n    \"\"\"\n    Main function: loads data, trains, evaluates model, returns model and Dice score.\n    \"\"\"\n    set_seed(42)\n    # Data path (sanitize path for Windows)\n    base_path = r\"E:\\python_project_new\\brain_case_study\\lgg-mri-segmentation\\case_study\"\n    train_img_dir = os.path.join(base_path, 'train', 'images')\n    train_mask_dir = os.path.join(base_path, 'train', 'masks')\n    val_img_dir = os.path.join(base_path, 'val', 'images')\n    val_mask_dir = os.path.join(base_path, 'val', 'masks')\n    test_img_dir = os.path.join(base_path, 'test', 'images')\n    test_mask_dir = os.path.join(base_path, 'test', 'masks')\n\n    # Hyperparameters\n    image_size = (256,256)\n    batch_size = 8\n    lr = 1e-3\n    epochs = 25\n    patience = 6\n\n    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')\n\n    # Datasets - robust to missing data\n    train_ds = MRISegmentationDataset(train_img_dir, train_mask_dir, augment=True, image_size=image_size)\n    val_ds = MRISegmentationDataset(val_img_dir, val_mask_dir, augment=False, image_size=image_size)\n    test_ds = MRISegmentationDataset(test_img_dir, test_mask_dir, augment=False, image_size=image_size)\n\n    # Robust: fail gracefully if any dataset is empty\n    if len(train_ds) == 0:\n        raise RuntimeError(f\"No training images found at {train_img_dir}\")\n    if len(val_ds) == 0:\n        raise RuntimeError(f\"No validation images found at {val_img_dir}\")\n    if len(test_ds) == 0:\n        raise RuntimeError(f\"No test images found at {test_img_dir}\")\n\n    train_loader = DataLoader(train_ds, batch_size=batch_size, shuffle=True, num_workers=2, pin_memory=True)\n    val_loader = DataLoader(val_ds, batch_size=batch_size, shuffle=False, num_workers=2, pin_memory=True)\n    test_loader = DataLoader(test_ds, batch_size=1, shuffle=False)\n\n    # Model, loss, optimizer\n    model = UNet(in_channels=3, out_channels=1).to(device)\n    criterion = nn.BCELoss()\n    optimizer = torch.optim.Adam(model.parameters(), lr=lr)\n\n    # Early stopping on validation Dice\n    best_val_dice = 0.0\n    best_epoch = -1\n    best_weights = None\n    no_improve_epochs = 0\n\n    for epoch in range(epochs):\n        train_loss = train_one_epoch(model, train_loader, criterion, optimizer, device)\n        val_loss, val_dice = eval_epoch(model, val_loader, criterion, device)\n        if val_dice > best_val_dice:\n            best_val_dice = val_dice\n            best_epoch = epoch\n            best_weights = model.state_dict()\n            no_improve_epochs = 0\n        else:\n            no_improve_epochs += 1\n        if no_improve_epochs >= patience:\n            break\n\n    # Restore the best weights\n    if best_weights is not None:\n        model.load_state_dict(best_weights)\n\n    # Evaluate on test set Dice\n    test_dice = test_eval(model, test_loader, device)\n    return model, test_dice\n\ndef plot_predictions(model, num_samples=4):\n    \"\"\"\n    Visualizes predictions from test set. Plots each row as input, GT mask, Predicted mask overlay.\n    \"\"\"\n    base_path = r\"E:\\python_project_new\\brain_case_study\\lgg-mri-segmentation\\case_study\"\n    test_img_dir = os.path.join(base_path, 'test', 'images')\n    test_mask_dir = os.path.join(base_path, 'test', 'masks')\n    image_size = (256,256)\n    test_ds = MRISegmentationDataset(test_img_dir, test_mask_dir, augment=False, image_size=image_size)\n    if len(test_ds) == 0:\n        raise RuntimeError(f\"No test data available for visualization in {test_img_dir}\")\n    # Choose num_samples random unique indices\n    sample_idxs = np.random.choice(len(test_ds), min(num_samples, len(test_ds)), replace=False)\n    device = next(model.parameters()).device\n    model.eval()\n    plt.figure(figsize=(12, 4*len(sample_idxs)))\n    with torch.no_grad():\n        for i, idx in enumerate(sample_idxs):\n            img, mask = test_ds[idx]\n            img_input = img.unsqueeze(0).to(device)\n            pred = model(img_input)\n            pred_mask = (pred[0,0].cpu().numpy() > 0.5).astype(np.uint8)\n            # Plot: input image, true mask, pred overlay\n            plt.subplot(len(sample_idxs), 3, i*3+1)\n            showimg = img.permute(1,2,0).cpu().numpy()\n            plt.imshow(showimg, cmap='gray')\n            plt.title(\"Input Image\")\n            plt.axis(\"off\")\n            plt.subplot(len(sample_idxs), 3, i*3+2)\n            plt.imshow(mask[0].cpu().numpy(), cmap='gray')\n            plt.title(\"True Mask\")\n            plt.axis(\"off\")\n            plt.subplot(len(sample_idxs), 3, i*3+3)\n            plt.imshow(showimg, cmap='gray')\n            plt.imshow(pred_mask, cmap='Reds', alpha=0.5)\n            plt.title(\"Predicted Overlay\")\n            plt.axis(\"off\")\n    plt.tight_layout()\n    plt.show()",
                "plan": "1. **Reproducibility**: The code sets all relevant random seeds.\n2. **Dataset Parsing and Preprocessing**\n    - Uses a robust custom Dataset class that finds all .tif files in `images/`, pairs them with corresponding `_mask.tif` files, and drops non-existing pairs.\n    - Loads and resizes images/masks, with normalization and data augmentations during training.\n    - Returns data as torch.float32 tensors suitable for input to a PyTorch CNN.\n3. **U-Net Model**\n    - Implements a standard encoder-decoder U-Net architecture including skip connections, batch norm, and ReLU.\n    - Outputs a probability mask via sigmoid.\n4. **Training and Validation**\n    - Uses BCE loss for segmentation.\n    - Training loop performs forward, backward, and optimizer steps per batch.\n    - Validation computes loss and Dice.\n    - Includes robust checks for dataset emptiness to avoid zero-length DataLoader errors.\n    - Automatically restores the best model (by validation Dice score) and leverages patience for early stopping.\n5. **Evaluation**\n    - Separately evaluates per-image Dice on the test set.\n6. **Visualization**\n    - The plotting function visualizes random predictions from the test set: shows input, true mask, and predicted overlay.\n7. **Main Integration**\n    - Calling `main()` triggers the entire workflow: dataset loading, model training, evaluation, and returns the trained model and test Dice score.\n    - Plotting is separated, to be called after training as needed.",
                "main_function_name": "main",
                "score": 0.12882052857067305,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.849,
                "radon_score": 0.43920528570673056,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 249, in main\n  File \"<string>\", line 155, in train_one_epoch\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\utils\\data\\dataloader.py\", line 439, in __iter__\n    return self._get_iterator()\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\utils\\data\\dataloader.py\", line 387, in _get_iterator\n    return _MultiProcessingDataLoaderIter(self)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\utils\\data\\dataloader.py\", line 1040, in __init__\n    w.start()\n  File \"d:\\anaconda3\\envs\\llm\\lib\\multiprocessing\\process.py\", line 121, in start\n    self._popen = self._Popen(self)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\multiprocessing\\context.py\", line 224, in _Popen\n    return _default_context.get_context().Process._Popen(process_obj)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\multiprocessing\\context.py\", line 327, in _Popen\n    return Popen(process_obj)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\multiprocessing\\popen_spawn_win32.py\", line 93, in __init__\n    reduction.dump(process_obj, to_child)\n  File \"d:\\anaconda3\\envs\\llm\\lib\\multiprocessing\\reduction.py\", line 60, in dump\n    ForkingPickler(file, protocol).dump(obj)\n_pickle.PicklingError: Can't pickle <class 'MRISegmentationDataset'>: attribute lookup MRISegmentationDataset on builtins failed\n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        },
        "4": {
            "code_0": {
                "code": "import os\nimport random\nimport numpy as np\nfrom glob import glob\nfrom PIL import Image\nimport torch\nfrom torch import nn\nfrom torch.utils.data import Dataset, DataLoader\nimport torch.nn.functional as F\nimport matplotlib.pyplot as plt\n\n# =============================\n# Utility: Seed Setup\ndef set_seed(seed=42):\n    \"\"\"\n    Set random seeds for reproducible results.\n    \"\"\"\n    random.seed(seed)\n    np.random.seed(seed)\n    torch.manual_seed(seed)\n    torch.cuda.manual_seed_all(seed)\n    torch.backends.cudnn.deterministic = True\n    torch.backends.cudnn.benchmark = False\n\n# =============================\n# Dataset Definition\nclass MRISegmentationDataset(Dataset):\n    \"\"\"\n    PyTorch Dataset for paired MRI images and segmentation masks.\n    \"\"\"\n    def __init__(self, images_dir, masks_dir, augment=False, image_size=(256,256)):\n        self.images_dir = images_dir\n        self.masks_dir = masks_dir\n        self.image_size = image_size\n        self.augment = augment\n\n        # Gather image and mask file pairs\n        self.image_paths = sorted(glob(os.path.join(self.images_dir, '*.tif')))\n        self.mask_paths = []\n        for img_path in self.image_paths:\n            img_base = os.path.basename(img_path).replace('.tif', '')\n            mask_path = os.path.join(self.masks_dir, img_base + '_mask.tif')\n            if os.path.exists(mask_path):\n                self.mask_paths.append(mask_path)\n            else:\n                self.mask_paths.append(None)\n        # Only keep pairs with both files\n        pairs = [(img, mask) for img, mask in zip(self.image_paths, self.mask_paths) if mask is not None]\n        self.image_paths = [p[0] for p in pairs]\n        self.mask_paths = [p[1] for p in pairs]\n\n    def __len__(self):\n        return len(self.image_paths)\n\n    def __getitem__(self, idx):\n        # --- Load image and mask files\n        img = Image.open(self.image_paths[idx]).convert('RGB')\n        mask = Image.open(self.mask_paths[idx]).convert('L') # Ensure single-channel\n\n        # --- Resize to fixed size for model input\n        img = img.resize(self.image_size, resample=Image.BILINEAR)\n        mask = mask.resize(self.image_size, resample=Image.NEAREST)\n\n        # --- Convert to numpy arrays\n        img = np.array(img).astype(np.float32) # [H,W,3]\n        mask = np.array(mask).astype(np.float32) # [H,W]\n        mask = (mask > 127).astype(np.float32) # threshold, create binary mask\n\n        # --- Normalize image [0,1] per-slice\n        minv, maxv = img.min(), img.max()\n        if maxv - minv > 0:\n            img = (img - minv) / (maxv - minv)\n        else:\n            img = img * 0. # All black if degenerate\n\n        # --- Data augmentation (applied on both image & mask)\n        if self.augment:\n            # Random horizontal flip\n            if random.random() < 0.5:\n                img = np.fliplr(img)\n                mask = np.fliplr(mask)\n            # Random vertical flip\n            if random.random() < 0.5:\n                img = np.flipud(img)\n                mask = np.flipud(mask)\n            # Random rotation (0, 90, 180, 270)\n            if random.random() < 0.5:\n                k = random.choice([1,2,3])\n                img = np.rot90(img, k)\n                mask = np.rot90(mask, k)\n            # Random brightness scaling\n            if random.random() < 0.5:\n                fac = 0.85 + 0.3 * random.random()\n                img = np.clip(img * fac, 0, 1)\n\n        # --- Convert to channel-first Torch tensors\n        img = torch.from_numpy(img.transpose(2, 0, 1)).float() # [3,H,W]\n        mask = torch.from_numpy(mask).float().unsqueeze(0)      # [1,H,W]\n        return img, mask\n\n# =============================\n# U-Net Building Blocks\nclass DoubleConv(nn.Module):\n    \"\"\"\n    Two sequential convolutional layers each with BN and ReLU.\n    \"\"\"\n    def __init__(self, in_channels, out_channels):\n        super().__init__()\n        self.seq = nn.Sequential(\n            nn.Conv2d(in_channels, out_channels, 3, padding=1, bias=False),\n            nn.BatchNorm2d(out_channels),\n            nn.ReLU(inplace=True),\n            nn.Conv2d(out_channels, out_channels, 3, padding=1, bias=False),\n            nn.BatchNorm2d(out_channels),\n            nn.ReLU(inplace=True)\n        )\n    def forward(self, x):\n        return self.seq(x)\n\nclass UNet(nn.Module):\n    \"\"\"\n    Standard U-Net for image segmentation.\n    \"\"\"\n    def __init__(self, in_channels=3, out_channels=1, features=[64,128,256,512]):\n        super().__init__()\n        self.downs = nn.ModuleList()\n        self.ups = nn.ModuleList()\n        ch = in_channels\n        # Contracting path (encoders)\n        for f in features:\n            self.downs.append(DoubleConv(ch, f))\n            ch = f\n        self.pool = nn.MaxPool2d(2)\n        # Bottleneck\n        self.bottleneck = DoubleConv(features[-1], features[-1]*2)\n        # Expanding path (decoders)\n        rev_feats = list(reversed(features))\n        ch = features[-1]*2\n        for f in rev_feats:\n            self.ups.append(nn.ConvTranspose2d(ch, f, kernel_size=2, stride=2))\n            self.ups.append(DoubleConv(f*2, f))\n            ch = f\n        self.final = nn.Conv2d(features[0], out_channels, kernel_size=1) # 1x1 conv for seg-map\n\n    def forward(self, x):\n        skips = []\n        for down in self.downs:\n            x = down(x)\n            skips.append(x)\n            x = self.pool(x)\n        x = self.bottleneck(x)\n        skips = skips[::-1]\n        for idx in range(0, len(self.ups), 2):\n            x = self.ups[idx](x)\n            skip = skips[idx//2]\n            # If shape mismatch due to downsampling rounding, interpolate\n            if x.shape[-2:] != skip.shape[-2:]:\n                x = F.interpolate(x, size=skip.shape[-2:], mode=\"bilinear\", align_corners=False)\n            x = torch.cat([skip, x], dim=1)\n            x = self.ups[idx+1](x)\n        x = self.final(x)\n        return torch.sigmoid(x) # For BCE loss; applies sigmoid\n\n# =============================\n# Dice Coefficient (batchwise)\ndef dice_coefficient(pred, target, threshold=0.5, eps=1e-7):\n    \"\"\"\n    Compute Dice coefficient between predicted and target masks.\n    Both pred, target: (N, 1, H, W)\n    \"\"\"\n    pred = (pred > threshold).float()\n    target = (target > threshold).float()\n    intersection = (pred * target).sum(dim=(2,3))\n    union = pred.sum(dim=(2,3)) + target.sum(dim=(2,3))\n    dice = (2.0 * intersection + eps) / (union + eps)\n    return dice.mean().item()\n\n# =============================\n# Training Loop (one epoch)\ndef train_one_epoch(model, loader, criterion, optimizer, device):\n    model.train()\n    running_loss = 0.0\n    num_samples = 0\n    for imgs, masks in loader:\n        imgs = imgs.to(device)\n        masks = masks.to(device)\n        optimizer.zero_grad()\n        preds = model(imgs)\n        loss = criterion(preds, masks)\n        loss.backward()\n        optimizer.step()\n        running_loss += loss.item() * imgs.size(0)\n        num_samples += imgs.size(0)\n    avg_loss = running_loss / (num_samples + 1e-8)\n    return avg_loss\n\n# =============================\n# Validation/Evaluation Loop\ndef eval_epoch(model, loader, criterion, device):\n    model.eval()\n    running_loss = 0.0\n    dices = []\n    num_samples = 0\n    with torch.no_grad():\n        for imgs, masks in loader:\n            imgs = imgs.to(device)\n            masks = masks.to(device)\n            preds = model(imgs)\n            loss = criterion(preds, masks)\n            running_loss += loss.item() * imgs.size(0)\n            dices.append(dice_coefficient(preds.cpu(), masks.cpu()))\n            num_samples += imgs.size(0)\n    avg_loss = running_loss / (num_samples + 1e-8)\n    mean_dice = np.mean(dices) if len(dices) > 0 else 0.0\n    return avg_loss, mean_dice\n\n# =============================\n# Test Evaluation (only Dice)\ndef test_eval(model, loader, device):\n    model.eval()\n    dices = []\n    with torch.no_grad():\n        for imgs, masks in loader:\n            imgs = imgs.to(device)\n            masks = masks.to(device)\n            preds = model(imgs)\n            dices.append(dice_coefficient(preds.cpu(), masks.cpu()))\n    return np.mean(dices) if dices else 0.0\n\n# =============================\ndef main():\n    \"\"\"\n    Main function to load data, train U-Net, evaluate on test set, and return model and test Dice.\n    Returns:\n        model : trained torch.nn.Module (U-Net)\n        test_dice : float (mean Dice on test set)\n    \"\"\"\n    set_seed(42)\n    # Dataset base path (use provided Windows-style path)\n    base_path = r\"E:\\python_project_new\\brain_case_study\\lgg-mri-segmentation\\case_study\"\n    # All directory paths\n    train_img_dir = os.path.join(base_path, 'train', 'images')\n    train_mask_dir = os.path.join(base_path, 'train', 'masks')\n    val_img_dir = os.path.join(base_path, 'val', 'images')\n    val_mask_dir = os.path.join(base_path, 'val', 'masks')\n    test_img_dir = os.path.join(base_path, 'test', 'images')\n    test_mask_dir = os.path.join(base_path, 'test', 'masks')\n\n    # Hyperparameters\n    image_size = (256,256)\n    batch_size = 8\n    lr = 1e-3\n    epochs = 25\n    patience = 5\n\n    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')\n\n    # --- Datasets\n    train_ds = MRISegmentationDataset(train_img_dir, train_mask_dir, augment=True, image_size=image_size)\n    val_ds = MRISegmentationDataset(val_img_dir, val_mask_dir, augment=False, image_size=image_size)\n    test_ds = MRISegmentationDataset(test_img_dir, test_mask_dir, augment=False, image_size=image_size)\n\n    # --- Empty dataset checks\n    if len(train_ds) == 0:\n        raise RuntimeError(f\"No training images found at {train_img_dir}\")\n    if len(val_ds) == 0:\n        raise RuntimeError(f\"No validation images found at {val_img_dir}\")\n    if len(test_ds) == 0:\n        raise RuntimeError(f\"No test images found at {test_img_dir}\")\n\n    # --- DataLoaders (num_workers=0 to avoid pickling issues on some systems)\n    train_loader = DataLoader(train_ds, batch_size=batch_size, shuffle=True, num_workers=0, pin_memory=False)\n    val_loader = DataLoader(val_ds, batch_size=batch_size, shuffle=False, num_workers=0, pin_memory=False)\n    test_loader = DataLoader(test_ds, batch_size=1, shuffle=False, num_workers=0)\n\n    # --- Model, Loss, Optimizer\n    model = UNet(in_channels=3, out_channels=1).to(device)\n    criterion = nn.BCELoss()\n    optimizer = torch.optim.Adam(model.parameters(), lr=lr)\n\n    # --- Early stopping tracking\n    best_val_dice = 0.0\n    best_epoch = -1\n    best_weights = None\n    epochs_no_improve = 0\n\n    for epoch in range(epochs):\n        train_loss = train_one_epoch(model, train_loader, criterion, optimizer, device)\n        val_loss, val_dice = eval_epoch(model, val_loader, criterion, device)\n        # Save model if validation Dice improves\n        if val_dice > best_val_dice:\n            best_val_dice = val_dice\n            best_epoch = epoch\n            best_weights = model.state_dict()\n            epochs_no_improve = 0\n        else:\n            epochs_no_improve += 1\n        # Early stop after patience epochs with no improvement\n        if epochs_no_improve >= patience:\n            break\n\n    # Restore model to best validation Dice\n    if best_weights is not None:\n        model.load_state_dict(best_weights)\n\n    # --- Test evaluation\n    test_dice = test_eval(model, test_loader, device)\n\n    return model, test_dice\n\n# =============================\ndef plot_predictions(model, num_samples=4):\n    \"\"\"\n    Function to plot predictions from the test set.\n    Args:\n        model: trained segmentation model\n        num_samples: number of sample images to show\n    \"\"\"\n    base_path = r\"E:\\python_project_new\\brain_case_study\\lgg-mri-segmentation\\case_study\"\n    test_img_dir = os.path.join(base_path, 'test', 'images')\n    test_mask_dir = os.path.join(base_path, 'test', 'masks')\n    image_size = (256,256)\n    test_ds = MRISegmentationDataset(test_img_dir, test_mask_dir, augment=False, image_size=image_size)\n    if len(test_ds) == 0:\n        raise RuntimeError(f\"No test data available for plotting in {test_img_dir}\")\n\n    # Randomly select unique indices\n    idxs = np.random.choice(len(test_ds), min(num_samples, len(test_ds)), replace=False)\n    device = next(model.parameters()).device\n    model.eval()\n    plt.figure(figsize=(12, 4*len(idxs)))\n    with torch.no_grad():\n        for i, idx in enumerate(idxs):\n            img, mask = test_ds[idx]\n            show_img = img.permute(1,2,0).cpu().numpy()  # [H,W,3], already normalized\n            mask_np = mask[0].cpu().numpy()\n            pred = model(img.unsqueeze(0).to(device))\n            pred_mask = (pred[0,0].cpu().numpy() > 0.5).astype(np.uint8)\n            # Display Input, GT, Prediction\n            plt.subplot(len(idxs), 3, i*3+1)\n            plt.imshow(show_img, cmap='gray')\n            plt.title(\"Input Image\")\n            plt.axis(\"off\")\n            plt.subplot(len(idxs), 3, i*3+2)\n            plt.imshow(mask_np, cmap='gray')\n            plt.title(\"Ground Truth Mask\")\n            plt.axis(\"off\")\n            plt.subplot(len(idxs), 3, i*3+3)\n            plt.imshow(show_img, cmap='gray')\n            plt.imshow(pred_mask, cmap='Reds', alpha=0.5)\n            plt.title(\"Predicted Overlay\")\n            plt.axis(\"off\")\n    plt.tight_layout()\n    plt.show()",
                "plan": "1. **Import libraries & set seeds:**  \n   Ensure reproducibility and correct library imports.\n\n2. **Dataset definition:**  \n   Define `MRISegmentationDataset` at module level to avoid pickling errors with DataLoader. It loads (and pairs) 2D image and mask files, preprocessing and augmenting as needed.\n\n3. **U-Net model construction:**  \n   Implement `UNet` and `DoubleConv` modules. The architecture uses downsampling encoders, a bottleneck, and upsampling decoders with skip connections; outputs probability masks via sigmoid.\n\n4. **Metric & training logic:**  \n   Dice coefficient is implemented for batchwise evaluation. Training, validation, and test loops are modular for clarity.\n\n5. **Main function (main):**  \n   - Loads train, val, test splits as datasets (checking all directories exist and are not empty).\n   - Builds DataLoaders (with `num_workers=0` for full portability).\n   - Initializes UNet, loss, optimizer.\n   - Trains with early stopping on validation Dice (patience parameter), always retaining best model weights.\n   - Evaluates the restored best model on the test set.\n   - Returns model and test Dice score.\n\n6. **Visualization:**  \n   A plotting function `plot_predictions(model, num_samples=4)` which visualizes test images with their true and predicted masks overlayed for qualitative assessment.\n\n7. **Integration:**  \n   All definitions are at the module/top-level (no local classes/functions) to ensure full compatibility with torch’s DataLoader and multiprocessing, even if used in console, scripts, or testing/test-harness frameworks.",
                "main_function_name": "main",
                "score": 0.13530359307340495,
                "pass_rate": 0.0,
                "pass_rate_score": 0.0,
                "prediction_score": 0.0,
                "pylint_score": 0.874,
                "radon_score": 0.4790359307340495,
                "test_case_results": {
                    "runnability_check": {
                        "success": false,
                        "reason": "test_failed",
                        "message": "code is not runnable, error: Traceback (most recent call last):\n  File \"<string>\", line 4, in test_function\n  File \"<string>\", line 288, in main\n  File \"<string>\", line 184, in train_one_epoch\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\utils\\data\\dataloader.py\", line 631, in __next__\n    data = self._next_data()\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\utils\\data\\dataloader.py\", line 675, in _next_data\n    data = self._dataset_fetcher.fetch(index)  # may raise StopIteration\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\utils\\data\\_utils\\fetch.py\", line 51, in fetch\n    data = [self.dataset[idx] for idx in possibly_batched_index]\n  File \"d:\\anaconda3\\envs\\llm\\lib\\site-packages\\torch\\utils\\data\\_utils\\fetch.py\", line 51, in <listcomp>\n    data = [self.dataset[idx] for idx in possibly_batched_index]\n  File \"<string>\", line 98, in __getitem__\nValueError: At least one stride in the given numpy array is negative, and tensors with negative strides are not currently supported. (You can probably work around this by making a copy of your array  with array.copy().) \n"
                    }
                },
                "test_weights": {
                    "runnability_check": 0.001
                }
            }
        }
    }
]