# Dataset directory, serialized as the argument list for pathlib.PosixPath.
# The tag is Python-specific, so a plain safe loader will not construct it.
# NOTE(review): the two bare `- ` entries below parse as null, not as path
# segments -- presumably directory names that were redacted or lost. A null
# segment is not expected to be accepted when the path is rebuilt; restore the
# real names (or remove the entries if they are spurious) before loading.
data_dir: !!python/object/apply:pathlib.PosixPath
- /
- projects
- 
- users
- 
- tusoml
- openproblems_datasets
- aide_denoise
# desc_file is null here; the task is stated inline through `goal`.
desc_file: null
# Folded block scalar: the line break inside the text becomes a single space
# and no trailing newline is kept, so the value is one continuous sentence pair.
goal: >-
  Build a method for single cell RNA-seq imputation. Create adata.obsm['denoised']
  from adata.obsm['train'], and compare against adata.obsm['test'].
# Evaluation instructions accompanying `goal`: one sentence followed by the
# Python source of the metric function `mse` (lower is better).
# Written as a literal block scalar so the embedded code reads exactly as it
# will be delivered: line breaks are kept and one trailing newline is retained.
# The earlier double-quoted form decoded the obsm keys to \"test\" and
# \"denoised\" with literal backslashes, which is not valid Python even though
# the text asks for the function to be used exactly; the keys are now plain
# double-quoted strings. Lines starting with `#` inside the block are part of
# the value, not YAML comments.
eval: |
  Use this exact function for evaluation. Lower is better.
  def mse(adata):
      import anndata
      import scanpy as sc
      import scprep
      import sklearn.metrics

      test_data = anndata.AnnData(X=adata.obsm["test"], obs=adata.obs, var=adata.var)
      denoised_data = anndata.AnnData(
          X=adata.obsm["denoised"], obs=adata.obs, var=adata.var
      )

      # scaling and transformation
      target_sum = 10000

      sc.pp.normalize_total(test_data, target_sum=target_sum)
      sc.pp.log1p(test_data)

      sc.pp.normalize_total(denoised_data, target_sum=target_sum)
      sc.pp.log1p(denoised_data)

      error = sklearn.metrics.mean_squared_error(
          scprep.utils.toarray(test_data.X), denoised_data.X
      )
      return error
# Log directory, serialized as the argument list for pathlib.PosixPath
# (Python-specific tag; a plain safe loader will not construct it).
# The final segment equals the value of `exp_name`.
# NOTE(review): the two bare `- ` entries parse as null rather than path
# segments -- presumably redacted directory names. Restore or remove them
# before this file is loaded again.
log_dir: !!python/object/apply:pathlib.PosixPath
- /
- projects
- 
- users
- 
- tusoml
- logs
- 0-huge-elephant-from-saturn
# Workspace directory, serialized as the argument list for pathlib.PosixPath
# (Python-specific tag; a plain safe loader will not construct it).
# The final segment equals the value of `exp_name`.
# NOTE(review): the two bare `- ` entries parse as null rather than path
# segments -- presumably redacted directory names. Restore or remove them
# before this file is loaded again.
workspace_dir: !!python/object/apply:pathlib.PosixPath
- /
- projects
- 
- users
- 
- tusoml
- workspaces
- 0-huge-elephant-from-saturn
# Data-handling switches; both are enabled in this configuration.
preprocess_data: true
copy_data: true
# Quoted so the digit-leading name is unambiguously a string. The same value
# appears as the last path segment of log_dir and workspace_dir.
exp_name: '0-huge-elephant-from-saturn'
# Execution settings.
# NOTE(review): the key layout matches the AIDE ML default config, where this
# group governs how generated code is run -- confirm against the consumer.
exec:
  # presumably seconds (3600 would be one hour) -- confirm the unit
  timeout: 3600
  # presumably the file name used for the generated script -- confirm
  agent_file_name: runfile.py
  format_tb_ipython: false
# Report generation is switched on. `report` carries a model name and a `temp`
# value (presumably the sampling temperature for that model -- confirm).
generate_report: true
report:
  model: gpt-4-turbo
  temp: 1.0
# Agent settings.
# NOTE(review): the key layout matches the AIDE ML default config; the per-key
# notes below follow that project's documented meanings and should be confirmed
# against the version that actually consumes this file.
agent:
  # presumably the number of improvement iterations to run -- confirm
  steps: 20
  # presumably the fold count the agent is told to use for cross-validation -- confirm
  k_fold_validation: 5
  expose_prediction: false
  data_preview: true
  # model/temp pair under `code` (presumably for code generation -- confirm)
  code:
    model: gpt-4o-mini
    temp: 0.5
  # model/temp pair under `feedback` (presumably for assessing run output -- confirm)
  feedback:
    model: gpt-4-turbo
    temp: 0.5
  # search parameters; exact semantics are not visible in this file
  search:
    max_debug_depth: 3
    debug_prob: 0.5
    num_drafts: 5
