<?xml version="1.0" encoding="UTF-8"?>
<project version="4">
  <component name="AutoImportSettings">
    <option name="autoReloadType" value="SELECTIVE" />
  </component>
  <component name="ChangeListManager">
    <list default="true" id="b4c59053-994a-48ba-a980-ef0b979ffc77" name="更改" comment="">
      <change beforePath="$PROJECT_DIR$/.gemini/config.yaml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/CODEOWNERS" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/PULL_REQUEST_TEMPLATE.md" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/dependabot.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/check-pr-title.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/checkpoint_converter.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/cpu_unit_tests.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/disabled/e2e_prime.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/doc.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/e2e_ascend.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/e2e_dapo.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/e2e_eval_aime24.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/e2e_genrm_remote.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/e2e_ppo_trainer.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/e2e_ppo_trainer_megatron_sglang.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/e2e_ppo_trainer_megatron_vllm.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/e2e_sft.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/e2e_spin.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/e2e_sppo.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/gpu_unit_tests.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/model.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/pre-commit-full.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/pre-commit.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/sanity.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/scorecard.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/secrets_scan.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/sgl.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/type-coverage-check.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.github/workflows/vllm.yml" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/.vscode/settings.json" beforeDir="false" />
      <change beforePath="$PROJECT_DIR$/examples/data_preprocess/gsm8k.py" beforeDir="false" afterPath="$PROJECT_DIR$/examples/data_preprocess/gsm8k.py" afterDir="false" />
      <change beforePath="$PROJECT_DIR$/examples/data_preprocess/math_dataset.py" beforeDir="false" afterPath="$PROJECT_DIR$/examples/data_preprocess/math_dataset.py" afterDir="false" />
      <change beforePath="$PROJECT_DIR$/scripts/install_vllm_sglang_mcore.sh" beforeDir="false" afterPath="$PROJECT_DIR$/scripts/install_vllm_sglang_mcore.sh" afterDir="false" />
      <change beforePath="$PROJECT_DIR$/verl/model_merger/base_model_merger.py" beforeDir="false" afterPath="$PROJECT_DIR$/verl/model_merger/base_model_merger.py" afterDir="false" />
      <change beforePath="$PROJECT_DIR$/verl/trainer/main_eval.py" beforeDir="false" afterPath="$PROJECT_DIR$/verl/trainer/main_eval.py" afterDir="false" />
      <change beforePath="$PROJECT_DIR$/verl/trainer/main_generation.py" beforeDir="false" afterPath="$PROJECT_DIR$/verl/trainer/main_generation.py" afterDir="false" />
      <change beforePath="$PROJECT_DIR$/verl/trainer/main_ppo.py" beforeDir="false" afterPath="$PROJECT_DIR$/verl/trainer/main_ppo.py" afterDir="false" />
      <change beforePath="$PROJECT_DIR$/verl/trainer/ppo/metric_utils.py" beforeDir="false" afterPath="$PROJECT_DIR$/verl/trainer/ppo/metric_utils.py" afterDir="false" />
      <change beforePath="$PROJECT_DIR$/verl/trainer/ppo/ray_trainer.py" beforeDir="false" afterPath="$PROJECT_DIR$/verl/trainer/ppo/ray_trainer.py" afterDir="false" />
      <change beforePath="$PROJECT_DIR$/verl/trainer/ppo/reward.py" beforeDir="false" afterPath="$PROJECT_DIR$/verl/trainer/ppo/reward.py" afterDir="false" />
      <change beforePath="$PROJECT_DIR$/verl/workers/fsdp_workers.py" beforeDir="false" afterPath="$PROJECT_DIR$/verl/workers/fsdp_workers.py" afterDir="false" />
      <change beforePath="$PROJECT_DIR$/verl/workers/reward_manager/__init__.py" beforeDir="false" afterPath="$PROJECT_DIR$/verl/workers/reward_manager/__init__.py" afterDir="false" />
    </list>
    <option name="SHOW_DIALOG" value="false" />
    <option name="HIGHLIGHT_CONFLICTS" value="true" />
    <option name="HIGHLIGHT_NON_ACTIVE_CHANGELIST" value="false" />
    <option name="LAST_RESOLUTION" value="IGNORE" />
  </component>
  <component name="FileTemplateManagerImpl">
    <option name="RECENT_TEMPLATES">
      <list>
        <option value="Python Script" />
      </list>
    </option>
  </component>
  <component name="FlaskConsoleOptions" custom-start-script="import sys; print('Python %s on %s' % (sys.version, sys.platform)); sys.path.extend([WORKING_DIR_AND_PYTHON_PATHS])&#10;from flask.cli import ScriptInfo, NoAppException&#10;for module in [&quot;main.py&quot;, &quot;wsgi.py&quot;, &quot;app.py&quot;]:&#10;    try: locals().update(ScriptInfo(app_import_path=module, create_app=None).load_app().make_shell_context()); print(&quot;\nFlask App: %s&quot; % app.import_name); break&#10;    except NoAppException: pass">
    <envs>
      <env key="FLASK_APP" value="app" />
    </envs>
    <option name="myCustomStartScript" value="import sys; print('Python %s on %s' % (sys.version, sys.platform)); sys.path.extend([WORKING_DIR_AND_PYTHON_PATHS])&#10;from flask.cli import ScriptInfo, NoAppException&#10;for module in [&quot;main.py&quot;, &quot;wsgi.py&quot;, &quot;app.py&quot;]:&#10;    try: locals().update(ScriptInfo(app_import_path=module, create_app=None).load_app().make_shell_context()); print(&quot;\nFlask App: %s&quot; % app.import_name); break&#10;    except NoAppException: pass" />
    <option name="myEnvs">
      <map>
        <entry key="FLASK_APP" value="app" />
      </map>
    </option>
  </component>
  <component name="Git.Settings">
    <option name="RECENT_GIT_ROOT_PATH" value="$PROJECT_DIR$" />
  </component>
  <component name="HighlightingSettingsPerFile">
    <setting file="file://$USER_HOME$/anaconda3/envs/verl/lib/python3.10/site-packages/hydra/core/override_parser/overrides_parser.py" root0="SKIP_INSPECTION" />
    <setting file="file://$USER_HOME$/anaconda3/envs/verl/lib/python3.10/site-packages/ray/_private/worker.py" root0="SKIP_INSPECTION" />
  </component>
  <component name="ProjectColorInfo">{
  &quot;associatedIndex&quot;: 7
}</component>
  <component name="ProjectId" id="2zVciaIRmQ8cjkStpgrVGj5CgKf" />
  <component name="ProjectViewState">
    <option name="hideEmptyMiddlePackages" value="true" />
    <option name="showLibraryContents" value="true" />
  </component>
  <component name="PropertiesComponent"><![CDATA[{
  "keyToString": {
    "Python 调试服务器.TaskRunner.executor": "Debug",
    "Python 调试服务器.generation.executor": "Debug",
    "Python.111.executor": "Run",
    "Python.222.executor": "Run",
    "Python.AIME2024.executor": "Run",
    "Python.AIME2025.executor": "Run",
    "Python.amc23.executor": "Run",
    "Python.cal_length.executor": "Debug",
    "Python.cal_length_feo.executor": "Run",
    "Python.correct_length2.executor": "Run",
    "Python.data_download.executor": "Run",
    "Python.gsm8k.executor": "Run",
    "Python.lora_merge.executor": "Run",
    "Python.main_eval.executor": "Run",
    "Python.main_generation.executor": "Run",
    "Python.main_ppo.executor": "Run",
    "Python.main_ppo2.executor": "Run",
    "Python.math500.executor": "Run",
    "Python.model_download.executor": "Run",
    "RunOnceActivity.ShowReadmeOnStart": "true",
    "RunOnceActivity.TerminalTabsStorage.copyFrom.TerminalArrangementManager.252": "true",
    "RunOnceActivity.git.unshallow": "true",
    "Shell Script.eval_for.sh.executor": "Run",
    "Shell Script.pt2hf.sh.executor": "Run",
    "Shell Script.未命名.executor": "Debug",
    "git-widget-placeholder": "main",
    "last_opened_file_path": "/Users/yinshengpeng/Documents/research/iclr2026/verl",
    "node.js.detected.package.eslint": "true",
    "node.js.detected.package.tslint": "true",
    "node.js.selected.package.eslint": "(autodetect)",
    "node.js.selected.package.tslint": "(autodetect)",
    "nodejs_package_manager_path": "npm",
    "vue.rearranger.settings.migration": "true"
  }
}]]></component>
  <component name="RdControllerToolWindowsLayoutState" isNewUi="true">
    <layout>
      <window_info id="Bookmarks" side_tool="true" />
      <window_info id="Merge Requests" show_stripe_button="false" />
      <window_info id="Backup and Sync History" />
      <window_info id="Commit_Guest" show_stripe_button="false" />
      <window_info id="Pull Requests" />
      <window_info id="Learn" show_stripe_button="false" />
      <window_info active="true" content_ui="combo" id="Project" order="0" visible="true" weight="0.35392857" />
      <window_info id="Commit" order="1" weight="0.25" />
      <window_info id="Structure" order="2" side_tool="true" weight="0.25" />
      <window_info anchor="bottom" id="Database Changes" />
      <window_info anchor="bottom" id="TypeScript" show_stripe_button="false" />
      <window_info anchor="bottom" id="TODO" />
      <window_info anchor="bottom" id="HfCacheToolWindow" show_stripe_button="false" />
      <window_info anchor="bottom" id="File Transfer" show_stripe_button="false" />
      <window_info anchor="bottom" id="Version Control" order="1" />
      <window_info anchor="bottom" id="Problems" order="2" />
      <window_info anchor="bottom" id="Problems View" order="3" />
      <window_info anchor="bottom" id="Services" order="4" />
      <window_info anchor="bottom" id="Python Packages" order="6" weight="0.1" />
      <window_info anchor="bottom" id="Python Console" order="7" weight="0.48935187" />
      <window_info anchor="bottom" id="Debug" order="8" weight="0.2951515" />
      <window_info anchor="bottom" id="Find" order="10" weight="0.43935186" />
      <window_info active="true" anchor="bottom" id="Terminal" order="11" sideWeight="0.49962008" visible="true" weight="0.41030303" />
      <window_info anchor="bottom" id="Run" order="12" sideWeight="0.5003799" weight="0.41272727" />
      <window_info anchor="right" id="Endpoints" show_stripe_button="false" />
      <window_info anchor="right" id="Coverage" show_stripe_button="false" side_tool="true" />
      <window_info anchor="right" id="Jupyter Variables" side_tool="true" />
      <window_info anchor="right" content_ui="combo" id="Notifications" order="0" weight="0.25" />
      <window_info anchor="right" id="AIAssistant" order="1" weight="0.25" />
      <window_info anchor="right" id="Database" order="2" weight="0.25" />
      <window_info anchor="right" id="Gradle" order="3" weight="0.25" />
      <window_info anchor="right" id="Maven" order="4" weight="0.25" />
      <window_info anchor="right" id="Plots" order="5" weight="0.1" />
      <window_info anchor="right" id="SciView" order="6" weight="0.6432143" />
    </layout>
  </component>
  <component name="RunManager" selected="Python.main_eval">
    <configuration name="TaskRunner" type="PyRemoteDebugConfigurationType" factoryName="Python Remote Debug">
      <module name="verl" />
      <option name="PORT" value="10087" />
      <option name="HOST" value="localhost" />
      <PathMappingSettings>
        <option name="pathMappings">
          <list />
        </option>
      </PathMappingSettings>
      <option name="REDIRECT_OUTPUT" value="true" />
      <option name="SUSPEND_AFTER_CONNECT" value="true" />
      <method v="2" />
    </configuration>
    <configuration name="generation" type="PyRemoteDebugConfigurationType" factoryName="Python Remote Debug">
      <module name="verl" />
      <option name="PORT" value="10088" />
      <option name="HOST" value="localhost" />
      <PathMappingSettings>
        <option name="pathMappings">
          <list />
        </option>
      </PathMappingSettings>
      <option name="REDIRECT_OUTPUT" value="true" />
      <option name="SUSPEND_AFTER_CONNECT" value="true" />
      <method v="2" />
    </configuration>
    <configuration name="amc23" type="PythonConfigurationType" factoryName="Python" temporary="true" nameIsGenerated="true">
      <module name="verl" />
      <option name="ENV_FILES" value="" />
      <option name="INTERPRETER_OPTIONS" value="" />
      <option name="PARENT_ENVS" value="true" />
      <envs>
        <env name="PYTHONUNBUFFERED" value="1" />
      </envs>
      <option name="SDK_HOME" value="" />
      <option name="WORKING_DIRECTORY" value="$PROJECT_DIR$/examples/data_preprocess" />
      <option name="IS_MODULE_SDK" value="true" />
      <option name="ADD_CONTENT_ROOTS" value="true" />
      <option name="ADD_SOURCE_ROOTS" value="true" />
      <EXTENSION ID="PythonCoverageRunConfigurationExtension" runner="coverage.py" />
      <option name="SCRIPT_NAME" value="$PROJECT_DIR$/examples/data_preprocess/amc23.py" />
      <option name="PARAMETERS" value="" />
      <option name="SHOW_COMMAND_LINE" value="false" />
      <option name="EMULATE_TERMINAL" value="false" />
      <option name="MODULE_MODE" value="false" />
      <option name="REDIRECT_INPUT" value="false" />
      <option name="INPUT_FILE" value="" />
      <method v="2" />
    </configuration>
    <configuration name="cal_length" type="PythonConfigurationType" factoryName="Python" temporary="true" nameIsGenerated="true">
      <module name="verl" />
      <option name="ENV_FILES" value="" />
      <option name="INTERPRETER_OPTIONS" value="" />
      <option name="PARENT_ENVS" value="true" />
      <envs>
        <env name="PYTHONUNBUFFERED" value="1" />
      </envs>
      <option name="SDK_HOME" value="" />
      <option name="WORKING_DIRECTORY" value="$PROJECT_DIR$/data" />
      <option name="IS_MODULE_SDK" value="true" />
      <option name="ADD_CONTENT_ROOTS" value="true" />
      <option name="ADD_SOURCE_ROOTS" value="true" />
      <EXTENSION ID="PythonCoverageRunConfigurationExtension" runner="coverage.py" />
      <option name="SCRIPT_NAME" value="$PROJECT_DIR$/data/cal_length.py" />
      <option name="PARAMETERS" value="" />
      <option name="SHOW_COMMAND_LINE" value="false" />
      <option name="EMULATE_TERMINAL" value="false" />
      <option name="MODULE_MODE" value="false" />
      <option name="REDIRECT_INPUT" value="false" />
      <option name="INPUT_FILE" value="" />
      <method v="2" />
    </configuration>
    <configuration name="cal_length_feo" type="PythonConfigurationType" factoryName="Python" temporary="true" nameIsGenerated="true">
      <module name="verl" />
      <option name="ENV_FILES" value="" />
      <option name="INTERPRETER_OPTIONS" value="" />
      <option name="PARENT_ENVS" value="true" />
      <envs>
        <env name="PYTHONUNBUFFERED" value="1" />
      </envs>
      <option name="SDK_HOME" value="" />
      <option name="WORKING_DIRECTORY" value="$PROJECT_DIR$/data" />
      <option name="IS_MODULE_SDK" value="true" />
      <option name="ADD_CONTENT_ROOTS" value="true" />
      <option name="ADD_SOURCE_ROOTS" value="true" />
      <EXTENSION ID="PythonCoverageRunConfigurationExtension" runner="coverage.py" />
      <option name="SCRIPT_NAME" value="$PROJECT_DIR$/data/cal_length_feo.py" />
      <option name="PARAMETERS" value="" />
      <option name="SHOW_COMMAND_LINE" value="false" />
      <option name="EMULATE_TERMINAL" value="false" />
      <option name="MODULE_MODE" value="false" />
      <option name="REDIRECT_INPUT" value="false" />
      <option name="INPUT_FILE" value="" />
      <method v="2" />
    </configuration>
    <configuration name="main_eval" type="PythonConfigurationType" factoryName="Python" nameIsGenerated="true">
      <module name="verl" />
      <option name="ENV_FILES" value="" />
      <option name="INTERPRETER_OPTIONS" value="" />
      <option name="PARENT_ENVS" value="true" />
      <envs>
        <env name="PYTHONUNBUFFERED" value="1" />
      </envs>
      <option name="SDK_HOME" value="" />
      <option name="WORKING_DIRECTORY" value="" />
      <option name="IS_MODULE_SDK" value="false" />
      <option name="ADD_CONTENT_ROOTS" value="true" />
      <option name="ADD_SOURCE_ROOTS" value="true" />
      <EXTENSION ID="PythonCoverageRunConfigurationExtension" runner="coverage.py" />
      <option name="SCRIPT_NAME" value="$PROJECT_DIR$/verl/trainer/main_eval.py" />
      <option name="PARAMETERS" value="data.path='$PROJECT_DIR$/data/openai___gsm8k/test_qwen3-0.6B-alpha0.01-ewma_3_5_10_20_25(0)_30(0)_gen.parquet'" />
      <option name="SHOW_COMMAND_LINE" value="false" />
      <option name="EMULATE_TERMINAL" value="false" />
      <option name="MODULE_MODE" value="false" />
      <option name="REDIRECT_INPUT" value="false" />
      <option name="INPUT_FILE" value="" />
      <method v="2" />
    </configuration>
    <configuration name="main_generation" type="PythonConfigurationType" factoryName="Python" nameIsGenerated="true">
      <module name="verl" />
      <option name="ENV_FILES" value="" />
      <option name="INTERPRETER_OPTIONS" value="" />
      <option name="PARENT_ENVS" value="true" />
      <envs>
        <env name="PYTHONUNBUFFERED" value="1" />
        <env name="CUDA_VISIBLE_DEVICES" value="4,5,6,7" />
      </envs>
      <option name="SDK_HOME" value="" />
      <option name="WORKING_DIRECTORY" value="" />
      <option name="IS_MODULE_SDK" value="false" />
      <option name="ADD_CONTENT_ROOTS" value="true" />
      <option name="ADD_SOURCE_ROOTS" value="true" />
      <EXTENSION ID="PythonCoverageRunConfigurationExtension" runner="coverage.py" />
      <option name="SCRIPT_NAME" value="$PROJECT_DIR$/verl/trainer/main_generation.py" />
      <option name="PARAMETERS" value="trainer.nnodes=1 trainer.n_gpus_per_node=4 data.path=$PROJECT_DIR$/data/openai___gsm8k/test.parquet data.prompt_key=prompt data.n_samples=1 data.output_path='$PROJECT_DIR$/data/openai___gsm8k/test_qwen3-0.6B-alpha0.01-ewma_3_5_10_20_25(0)_30(0)_gen.parquet' model.path='$PROJECT_DIR$/checkpoints/verl_grpo_example_gsm8k/Qwen3-0.6B-alpha0.01-ewma_3_5_10_20_25(0)_30(0)/huggingface/global_step_109' +model.trust_remote_code=True rollout.load_format=safetensors rollout.prompt_length=256 rollout.response_length=3072 rollout.tensor_model_parallel_size=1 rollout.gpu_memory_utilization=0.8" />
      <option name="SHOW_COMMAND_LINE" value="false" />
      <option name="EMULATE_TERMINAL" value="false" />
      <option name="MODULE_MODE" value="false" />
      <option name="REDIRECT_INPUT" value="false" />
      <option name="INPUT_FILE" value="" />
      <method v="2" />
    </configuration>
    <configuration name="main_ppo" type="PythonConfigurationType" factoryName="Python" nameIsGenerated="true">
      <module name="verl" />
      <option name="ENV_FILES" value="" />
      <option name="INTERPRETER_OPTIONS" value="" />
      <option name="PARENT_ENVS" value="true" />
      <envs>
        <env name="PYTHONUNBUFFERED" value="1" />
        <env name="CUDA_VISIBLE_DEVICES" value="4,5,6,7" />
      </envs>
      <option name="SDK_HOME" value="" />
      <option name="WORKING_DIRECTORY" value="" />
      <option name="IS_MODULE_SDK" value="false" />
      <option name="ADD_CONTENT_ROOTS" value="true" />
      <option name="ADD_SOURCE_ROOTS" value="true" />
      <EXTENSION ID="PythonCoverageRunConfigurationExtension" runner="coverage.py" />
      <option name="SCRIPT_NAME" value="$PROJECT_DIR$/verl/trainer/main_ppo.py" />
      <option name="PARAMETERS" value="algorithm.adv_estimator=grpo data.train_files=$PROJECT_DIR$/data/DigitalLearningGmbH___math-lighteval/train.parquet data.val_files=$PROJECT_DIR$/data/DigitalLearningGmbH___math-lighteval/test.parquet data.train_batch_size=64 data.max_prompt_length=256 data.max_response_length=3072 data.filter_overlong_prompts=True data.truncation='error' actor_rollout_ref.model.path=&quot;$PROJECT_DIR$/../models/DeepSeek-R1-Distill-Qwen-1.5B&quot; actor_rollout_ref.actor.optim.lr=5e-7 actor_rollout_ref.model.use_remove_padding=True actor_rollout_ref.actor.ppo_mini_batch_size=64 actor_rollout_ref.actor.ppo_micro_batch_size_per_gpu=1 actor_rollout_ref.actor.use_kl_loss=True actor_rollout_ref.actor.kl_loss_coef=0.001 actor_rollout_ref.actor.kl_loss_type=low_var_kl actor_rollout_ref.actor.entropy_coeff=0 actor_rollout_ref.model.enable_gradient_checkpointing=True actor_rollout_ref.actor.fsdp_config.param_offload=True actor_rollout_ref.actor.fsdp_config.optimizer_offload=True actor_rollout_ref.rollout.log_prob_micro_batch_size_per_gpu=16 actor_rollout_ref.rollout.tensor_model_parallel_size=4 actor_rollout_ref.rollout.name=vllm actor_rollout_ref.rollout.gpu_memory_utilization=0.7 actor_rollout_ref.rollout.n=16 actor_rollout_ref.ref.log_prob_micro_batch_size_per_gpu=16 actor_rollout_ref.ref.fsdp_config.param_offload=True algorithm.use_kl_in_reward=False trainer.critic_warmup=0 trainer.logger=['console','tensorboard'] trainer.project_name='verl_grpo_example_math' trainer.experiment_name='DeepSeek-R1-Distill-Qwen-1.5B-alpha0.01-ewma_3_5_10_20_25(0)_30(0)-test' trainer.n_gpus_per_node=4 trainer.nnodes=1 trainer.save_freq=1 trainer.test_freq=116 trainer.total_epochs=1 trainer.balance_batch=False actor_rollout_ref.rollout.val_kwargs.n=16 custom_reward_function.path=$PROJECT_DIR$/verl/utils/reward_score/correct_length.py reward_model.reward_manager='naive_length' trainer.val_before_train=False actor_rollout_ref.actor.ulysses_sequence_parallel_size=2 actor_rollout_ref.model.use_remove_padding=True actor_rollout_ref.model.enable_gradient_checkpointing=True actor_rollout_ref.model.use_shm=True actor_rollout_ref.rollout.layered_summon=True" />
      <option name="SHOW_COMMAND_LINE" value="false" />
      <option name="EMULATE_TERMINAL" value="false" />
      <option name="MODULE_MODE" value="false" />
      <option name="REDIRECT_INPUT" value="false" />
      <option name="INPUT_FILE" value="" />
      <method v="2" />
    </configuration>
    <configuration name="main_ppo2" type="PythonConfigurationType" factoryName="Python">
      <module name="verl" />
      <option name="ENV_FILES" value="" />
      <option name="INTERPRETER_OPTIONS" value="" />
      <option name="PARENT_ENVS" value="true" />
      <envs>
        <env name="PYTHONUNBUFFERED" value="1" />
        <env name="CUDA_VISIBLE_DEVICES" value="4,5,6,7" />
      </envs>
      <option name="SDK_HOME" value="" />
      <option name="WORKING_DIRECTORY" value="" />
      <option name="IS_MODULE_SDK" value="false" />
      <option name="ADD_CONTENT_ROOTS" value="true" />
      <option name="ADD_SOURCE_ROOTS" value="true" />
      <EXTENSION ID="PythonCoverageRunConfigurationExtension" runner="coverage.py" />
      <option name="SCRIPT_NAME" value="$PROJECT_DIR$/verl/trainer/main_ppo.py" />
      <option name="PARAMETERS" value="algorithm.adv_estimator=grpo data.train_files=$PROJECT_DIR$/data/openai___gsm8k/train.parquet data.val_files=$PROJECT_DIR$/data/openai___gsm8k/test.parquet data.train_batch_size=64 data.max_prompt_length=256 data.max_response_length=3072 data.filter_overlong_prompts=True data.truncation='error' actor_rollout_ref.model.path=&quot;$PROJECT_DIR$/../models/Qwen3-1.7B&quot; actor_rollout_ref.actor.optim.lr=5e-7 actor_rollout_ref.model.use_remove_padding=True actor_rollout_ref.actor.ppo_mini_batch_size=64 actor_rollout_ref.actor.ppo_micro_batch_size_per_gpu=1 actor_rollout_ref.actor.use_kl_loss=True actor_rollout_ref.actor.kl_loss_coef=0.001 actor_rollout_ref.actor.kl_loss_type=low_var_kl actor_rollout_ref.actor.entropy_coeff=0 actor_rollout_ref.model.enable_gradient_checkpointing=True actor_rollout_ref.actor.fsdp_config.param_offload=True actor_rollout_ref.actor.fsdp_config.optimizer_offload=True actor_rollout_ref.rollout.log_prob_micro_batch_size_per_gpu=16 actor_rollout_ref.rollout.tensor_model_parallel_size=4 actor_rollout_ref.rollout.name=vllm actor_rollout_ref.rollout.gpu_memory_utilization=0.7 actor_rollout_ref.rollout.n=16 actor_rollout_ref.ref.log_prob_micro_batch_size_per_gpu=16 actor_rollout_ref.ref.fsdp_config.param_offload=True algorithm.use_kl_in_reward=False trainer.critic_warmup=0 trainer.logger=['console','tensorboard'] trainer.project_name='verl_grpo_example_gsm8k' trainer.experiment_name='Qwen3-1.7B-alpha0.01-ewma_3_5_10_20_25(0)_30(0)' trainer.n_gpus_per_node=4 trainer.nnodes=1 trainer.save_freq=1 trainer.test_freq=116 trainer.total_epochs=1 trainer.balance_batch=False actor_rollout_ref.rollout.val_kwargs.n=16 custom_reward_function.path=$PROJECT_DIR$/verl/utils/reward_score/correct_length2.py reward_model.reward_manager='naive_no_length' trainer.val_before_train=False actor_rollout_ref.actor.ulysses_sequence_parallel_size=2 actor_rollout_ref.model.use_remove_padding=True actor_rollout_ref.model.enable_gradient_checkpointing=True actor_rollout_ref.model.use_shm=True actor_rollout_ref.rollout.layered_summon=True" />
      <option name="SHOW_COMMAND_LINE" value="false" />
      <option name="EMULATE_TERMINAL" value="false" />
      <option name="MODULE_MODE" value="false" />
      <option name="REDIRECT_INPUT" value="false" />
      <option name="INPUT_FILE" value="" />
      <method v="2" />
    </configuration>
    <configuration name="未命名" type="ShConfigurationType" nameIsGenerated="true">
      <option name="SCRIPT_TEXT" value="" />
      <option name="INDEPENDENT_SCRIPT_PATH" value="true" />
      <option name="SCRIPT_PATH" value="$PROJECT_DIR$/exp_scripts/run_qwen3_0.6b_grpo.sh" />
      <option name="SCRIPT_OPTIONS" value="" />
      <option name="INDEPENDENT_SCRIPT_WORKING_DIRECTORY" value="true" />
      <option name="SCRIPT_WORKING_DIRECTORY" value="$PROJECT_DIR$" />
      <option name="INDEPENDENT_INTERPRETER_PATH" value="true" />
      <option name="INTERPRETER_PATH" value="/bin/bash" />
      <option name="INTERPRETER_OPTIONS" value="" />
      <option name="EXECUTE_IN_TERMINAL" value="true" />
      <option name="EXECUTE_SCRIPT_FILE" value="true" />
      <envs>
        <env name="CUDA_VISIBLE_DEVICES" value="0,1,2,3,4,5,6,7" />
      </envs>
      <method v="2" />
    </configuration>
    <configuration name="eval_for.sh" type="ShConfigurationType" temporary="true">
      <option name="SCRIPT_TEXT" value="" />
      <option name="INDEPENDENT_SCRIPT_PATH" value="true" />
      <option name="SCRIPT_PATH" value="$PROJECT_DIR$/data/eval_for.sh" />
      <option name="SCRIPT_OPTIONS" value="" />
      <option name="INDEPENDENT_SCRIPT_WORKING_DIRECTORY" value="true" />
      <option name="SCRIPT_WORKING_DIRECTORY" value="$PROJECT_DIR$/data" />
      <option name="INDEPENDENT_INTERPRETER_PATH" value="true" />
      <option name="INTERPRETER_PATH" value="/bin/bash" />
      <option name="INTERPRETER_OPTIONS" value="" />
      <option name="EXECUTE_IN_TERMINAL" value="true" />
      <option name="EXECUTE_SCRIPT_FILE" value="true" />
      <envs />
      <method v="2" />
    </configuration>
    <configuration name="pt2hf.sh" type="ShConfigurationType" temporary="true">
      <option name="SCRIPT_TEXT" value="" />
      <option name="INDEPENDENT_SCRIPT_PATH" value="true" />
      <option name="SCRIPT_PATH" value="$PROJECT_DIR$/checkpoints/pt2hf.sh" />
      <option name="SCRIPT_OPTIONS" value="" />
      <option name="INDEPENDENT_SCRIPT_WORKING_DIRECTORY" value="true" />
      <option name="SCRIPT_WORKING_DIRECTORY" value="$PROJECT_DIR$/checkpoints" />
      <option name="INDEPENDENT_INTERPRETER_PATH" value="true" />
      <option name="INTERPRETER_PATH" value="/bin/bash" />
      <option name="INTERPRETER_OPTIONS" value="" />
      <option name="EXECUTE_IN_TERMINAL" value="true" />
      <option name="EXECUTE_SCRIPT_FILE" value="true" />
      <envs />
      <method v="2" />
    </configuration>
    <list>
      <item itemvalue="Python.main_eval" />
      <item itemvalue="Python.main_generation" />
      <item itemvalue="Python.main_ppo" />
      <item itemvalue="Python.main_ppo2" />
      <item itemvalue="Python.cal_length_feo" />
      <item itemvalue="Python.amc23" />
      <item itemvalue="Python.cal_length" />
      <item itemvalue="Python 调试服务器.TaskRunner" />
      <item itemvalue="Python 调试服务器.generation" />
      <item itemvalue="Shell Script.未命名" />
      <item itemvalue="Shell Script.pt2hf.sh" />
      <item itemvalue="Shell Script.eval_for.sh" />
    </list>
    <recent_temporary>
      <list>
        <item itemvalue="Python.cal_length" />
        <item itemvalue="Shell Script.pt2hf.sh" />
        <item itemvalue="Python.cal_length_feo" />
        <item itemvalue="Shell Script.eval_for.sh" />
        <item itemvalue="Python.amc23" />
      </list>
    </recent_temporary>
  </component>
  <component name="SharedIndexes">
    <attachedChunks>
      <set>
        <option value="bundled-js-predefined-d6986cc7102b-09060db00ec0-JavaScript-PY-251.26927.90" />
        <option value="bundled-python-sdk-41e8cd69c857-64d779b69b7a-com.jetbrains.pycharm.pro.sharedIndexes.bundled-PY-251.26927.90" />
      </set>
    </attachedChunks>
  </component>
  <component name="SpellCheckerSettings" RuntimeDictionaries="0" Folders="0" CustomDictionaries="0" DefaultDictionary="应用程序级" UseSingleDictionary="true" transferred="true" />
  <component name="TaskManager">
    <task active="true" id="Default" summary="默认任务">
      <changelist id="b4c59053-994a-48ba-a980-ef0b979ffc77" name="更改" comment="" />
      <created>1751819810022</created>
      <option name="number" value="Default" />
      <option name="presentableId" value="Default" />
      <updated>1751819810022</updated>
      <workItem from="1751819811650" duration="31370000" />
      <workItem from="1752071941425" duration="16272000" />
      <workItem from="1752162649776" duration="2935000" />
      <workItem from="1752195723074" duration="22455000" />
      <workItem from="1752244188954" duration="29397000" />
      <workItem from="1756897422684" duration="16614000" />
      <workItem from="1756946310832" duration="44933000" />
      <workItem from="1757152048788" duration="9484000" />
      <workItem from="1757235903361" duration="13000" />
      <workItem from="1757259672581" duration="6678000" />
      <workItem from="1757317468792" duration="4106000" />
      <workItem from="1757328260485" duration="4000" />
      <workItem from="1757331357778" duration="65000" />
      <workItem from="1757331432141" duration="4908000" />
      <workItem from="1757337039560" duration="2515000" />
      <workItem from="1757342092195" duration="4675000" />
      <workItem from="1757491483546" duration="50264000" />
      <workItem from="1757750966574" duration="54456000" />
      <workItem from="1758190816218" duration="126419000" />
      <workItem from="1758636109970" duration="21376000" />
      <workItem from="1758796545172" duration="533000" />
    </task>
    <servers />
  </component>
  <component name="TypeScriptGeneratedFilesManager">
    <option name="version" value="3" />
  </component>
  <component name="XDebuggerManager">
    <breakpoint-manager>
      <breakpoints>
        <line-breakpoint enabled="true" suspend="THREAD" type="python-line">
          <url>file://$PROJECT_DIR$/verl/workers/reward_manager/naive.py</url>
          <line>74</line>
          <option name="timeStamp" value="41" />
        </line-breakpoint>
        <line-breakpoint enabled="true" suspend="THREAD" type="python-line">
          <url>file://$PROJECT_DIR$/verl/workers/reward_manager/naive_length.py</url>
          <line>143</line>
          <option name="timeStamp" value="70" />
        </line-breakpoint>
        <line-breakpoint enabled="true" suspend="THREAD" type="python-line">
          <url>file://$PROJECT_DIR$/verl/workers/reward_manager/naive_length.py</url>
          <line>141</line>
          <option name="timeStamp" value="71" />
        </line-breakpoint>
        <line-breakpoint enabled="true" suspend="THREAD" type="python-line">
          <url>file://$PROJECT_DIR$/verl/workers/reward_manager/naive_length.py</url>
          <line>131</line>
          <option name="timeStamp" value="72" />
        </line-breakpoint>
        <line-breakpoint enabled="true" suspend="THREAD" type="python-line">
          <url>file://$PROJECT_DIR$/data/cal_length.py</url>
          <line>8</line>
          <option name="timeStamp" value="73" />
        </line-breakpoint>
        <line-breakpoint enabled="true" suspend="THREAD" type="python-line">
          <url>file://$PROJECT_DIR$/data/cal_length.py</url>
          <line>24</line>
          <option name="timeStamp" value="74" />
        </line-breakpoint>
      </breakpoints>
    </breakpoint-manager>
  </component>
  <component name="com.intellij.coverage.CoverageDataManagerImpl">
    <SUITE FILE_PATH="coverage/verl$lora_merge.coverage" NAME="lora_merge 覆盖结果" MODIFIED="1756993943442" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="false" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$/checkpoints" />
    <SUITE FILE_PATH="coverage/verl$AIME2025.coverage" NAME="AIME2025 覆盖结果" MODIFIED="1758508681440" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="false" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$/examples/data_preprocess" />
    <SUITE FILE_PATH="coverage/verl$model_download.coverage" NAME="model_download 覆盖结果" MODIFIED="1757063621077" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="false" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$" />
    <SUITE FILE_PATH="coverage/verl$main_ppo2.coverage" NAME="main_ppo2 覆盖结果" MODIFIED="1758532823008" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="false" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="" />
    <SUITE FILE_PATH="coverage/verl$main_generation.coverage" NAME="main_generation 覆盖结果" MODIFIED="1758697945949" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="false" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="" />
    <SUITE FILE_PATH="coverage/verl$222.coverage" NAME="222 覆盖结果" MODIFIED="1756994146395" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="false" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$" />
    <SUITE FILE_PATH="coverage/verl$main_eval.coverage" NAME="main_eval 覆盖结果" MODIFIED="1758699356645" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="false" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="" />
    <SUITE FILE_PATH="coverage/verl$cal_length_feo.coverage" NAME="cal_length_feo 覆盖结果" MODIFIED="1758547985475" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="false" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$/data" />
    <SUITE FILE_PATH="coverage/verl$111.coverage" NAME="111 覆盖结果" MODIFIED="1756991427344" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="false" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$" />
    <SUITE FILE_PATH="coverage/verl$math500.coverage" NAME="math500 覆盖结果" MODIFIED="1758506703464" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="false" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$/examples/data_preprocess" />
    <SUITE FILE_PATH="coverage/verl$gsm8k.coverage" NAME="gsm8k 覆盖结果" MODIFIED="1752405432815" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="false" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$/examples/data_preprocess" />
    <SUITE FILE_PATH="coverage/verl$correct_length2.coverage" NAME="correct_length2 覆盖结果" MODIFIED="1758442754823" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="false" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$/verl/utils/reward_score" />
    <SUITE FILE_PATH="coverage/verl$amc23.coverage" NAME="amc23 覆盖结果" MODIFIED="1758509077914" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="false" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$/examples/data_preprocess" />
    <SUITE FILE_PATH="coverage/verl$AIME2024.coverage" NAME="AIME2024 覆盖结果" MODIFIED="1758463197153" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="false" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$/examples/data_preprocess" />
    <SUITE FILE_PATH="coverage/verl$math_dataset.coverage" NAME="math_dataset 覆盖结果" MODIFIED="1752563112206" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="false" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$/examples/data_preprocess" />
    <SUITE FILE_PATH="coverage/verl$main_ppo.coverage" NAME="main_ppo 覆盖结果" MODIFIED="1758698588686" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="false" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="" />
    <SUITE FILE_PATH="coverage/verl$cal_length.coverage" NAME="cal_length 覆盖结果" MODIFIED="1758698945772" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="false" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$/data" />
    <SUITE FILE_PATH="coverage/verl$data_download.coverage" NAME="data_download 覆盖结果" MODIFIED="1758460000269" SOURCE_PROVIDER="com.intellij.coverage.DefaultCoverageFileProvider" RUNNER="coverage.py" COVERAGE_BY_TEST_ENABLED="false" COVERAGE_TRACING_ENABLED="false" WORKING_DIRECTORY="$PROJECT_DIR$" />
  </component>
</project>