[
  {
    "error": "CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\nTraceback (most recent call last):\n  File \"/home/ray/default/scripts/run_qwen1.5b_distributed.py\", line 222, in train\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 963, in train\n    experiences = self._collect_experiences_local(\n                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 776, in _collect_experiences_local\n    outputs = self.model.generate(\n              ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/peft/peft_model.py\", line 2048, in generate\n    outputs = self.base_model.generate(*args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/utils/_contextlib.py\", line 124, in decorate_context\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2566, in generate\n    result = decoding_method(\n             ^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2786, in _sample\n    outputs = self(**model_inputs, return_dict=True)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 918, in wrapper\n    output = func(self, *args, **kwargs)\n             ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 449, in forward\n    outputs: BaseModelOutputWithPast = self.model(\n                                       ^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 1072, in wrapper\n    outputs = func(self, *args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 384, in forward\n    hidden_states = decoder_layer(\n                    ^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/modeling_layers.py\", line 94, in __call__\n    return super().__call__(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 234, in forward\n    hidden_states, _ = self.self_attn(\n                       ^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 169, in forward\n    attn_output, attn_weights = attention_interface(\n                                ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 109, in eager_attention_forward\n    attn_weights = torch.matmul(query, key_states.transpose(2, 3)) * scaling\n                   ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\nRuntimeError: CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\n",
    "method": "sync",
    "seed": 42
  },
  {
    "error": "CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\nTraceback (most recent call last):\n  File \"/home/ray/default/scripts/run_qwen1.5b_distributed.py\", line 222, in train\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 963, in train\n    experiences = self._collect_experiences_local(\n                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 776, in _collect_experiences_local\n    outputs = self.model.generate(\n              ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/peft/peft_model.py\", line 2048, in generate\n    outputs = self.base_model.generate(*args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/utils/_contextlib.py\", line 124, in decorate_context\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2566, in generate\n    result = decoding_method(\n             ^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2786, in _sample\n    outputs = self(**model_inputs, return_dict=True)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 918, in wrapper\n    output = func(self, *args, **kwargs)\n             ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 449, in forward\n    outputs: BaseModelOutputWithPast = self.model(\n                                       ^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 1072, in wrapper\n    outputs = func(self, *args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 384, in forward\n    hidden_states = decoder_layer(\n                    ^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/modeling_layers.py\", line 94, in __call__\n    return super().__call__(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 234, in forward\n    hidden_states, _ = self.self_attn(\n                       ^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 169, in forward\n    attn_output, attn_weights = attention_interface(\n                                ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 109, in eager_attention_forward\n    attn_weights = torch.matmul(query, key_states.transpose(2, 3)) * scaling\n                   ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\nRuntimeError: CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\n",
    "method": "sync",
    "seed": 123
  },
  {
    "error": "CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\nTraceback (most recent call last):\n  File \"/home/ray/default/scripts/run_qwen1.5b_distributed.py\", line 222, in train\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 963, in train\n    experiences = self._collect_experiences_local(\n                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 776, in _collect_experiences_local\n    outputs = self.model.generate(\n              ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/peft/peft_model.py\", line 2048, in generate\n    outputs = self.base_model.generate(*args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/utils/_contextlib.py\", line 124, in decorate_context\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2566, in generate\n    result = decoding_method(\n             ^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2786, in _sample\n    outputs = self(**model_inputs, return_dict=True)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 918, in wrapper\n    output = func(self, *args, **kwargs)\n             ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 449, in forward\n    outputs: BaseModelOutputWithPast = self.model(\n                                       ^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 1072, in wrapper\n    outputs = func(self, *args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 384, in forward\n    hidden_states = decoder_layer(\n                    ^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/modeling_layers.py\", line 94, in __call__\n    return super().__call__(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 234, in forward\n    hidden_states, _ = self.self_attn(\n                       ^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 169, in forward\n    attn_output, attn_weights = attention_interface(\n                                ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 109, in eager_attention_forward\n    attn_weights = torch.matmul(query, key_states.transpose(2, 3)) * scaling\n                   ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\nRuntimeError: CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\n",
    "method": "sync",
    "seed": 456
  },
  {
    "error": "CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\nTraceback (most recent call last):\n  File \"/home/ray/default/scripts/run_qwen1.5b_distributed.py\", line 222, in train\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 963, in train\n    experiences = self._collect_experiences_local(\n                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 776, in _collect_experiences_local\n    outputs = self.model.generate(\n              ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/peft/peft_model.py\", line 2048, in generate\n    outputs = self.base_model.generate(*args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/utils/_contextlib.py\", line 124, in decorate_context\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2566, in generate\n    result = decoding_method(\n             ^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2786, in _sample\n    outputs = self(**model_inputs, return_dict=True)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 918, in wrapper\n    output = func(self, *args, **kwargs)\n             ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 449, in forward\n    outputs: BaseModelOutputWithPast = self.model(\n                                       ^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 1072, in wrapper\n    outputs = func(self, *args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 384, in forward\n    hidden_states = decoder_layer(\n                    ^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/modeling_layers.py\", line 94, in __call__\n    return super().__call__(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 234, in forward\n    hidden_states, _ = self.self_attn(\n                       ^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 169, in forward\n    attn_output, attn_weights = attention_interface(\n                                ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 109, in eager_attention_forward\n    attn_weights = torch.matmul(query, key_states.transpose(2, 3)) * scaling\n                   ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\nRuntimeError: CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\n",
    "method": "sync_curriculum",
    "seed": 42
  },
  {
    "error": "CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\nTraceback (most recent call last):\n  File \"/home/ray/default/scripts/run_qwen1.5b_distributed.py\", line 222, in train\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 963, in train\n    experiences = self._collect_experiences_local(\n                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 776, in _collect_experiences_local\n    outputs = self.model.generate(\n              ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/peft/peft_model.py\", line 2048, in generate\n    outputs = self.base_model.generate(*args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/utils/_contextlib.py\", line 124, in decorate_context\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2566, in generate\n    result = decoding_method(\n             ^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2786, in _sample\n    outputs = self(**model_inputs, return_dict=True)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 918, in wrapper\n    output = func(self, *args, **kwargs)\n             ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 449, in forward\n    outputs: BaseModelOutputWithPast = self.model(\n                                       ^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 1072, in wrapper\n    outputs = func(self, *args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 384, in forward\n    hidden_states = decoder_layer(\n                    ^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/modeling_layers.py\", line 94, in __call__\n    return super().__call__(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 234, in forward\n    hidden_states, _ = self.self_attn(\n                       ^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 169, in forward\n    attn_output, attn_weights = attention_interface(\n                                ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 109, in eager_attention_forward\n    attn_weights = torch.matmul(query, key_states.transpose(2, 3)) * scaling\n                   ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\nRuntimeError: CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\n",
    "method": "sync_curriculum",
    "seed": 123
  },
  {
    "error": "CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\nTraceback (most recent call last):\n  File \"/home/ray/default/scripts/run_qwen1.5b_distributed.py\", line 222, in train\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 963, in train\n    experiences = self._collect_experiences_local(\n                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 776, in _collect_experiences_local\n    outputs = self.model.generate(\n              ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/peft/peft_model.py\", line 2048, in generate\n    outputs = self.base_model.generate(*args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/utils/_contextlib.py\", line 124, in decorate_context\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2566, in generate\n    result = decoding_method(\n             ^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2786, in _sample\n    outputs = self(**model_inputs, return_dict=True)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 918, in wrapper\n    output = func(self, *args, **kwargs)\n             ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 449, in forward\n    outputs: BaseModelOutputWithPast = self.model(\n                                       ^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 1072, in wrapper\n    outputs = func(self, *args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 384, in forward\n    hidden_states = decoder_layer(\n                    ^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/modeling_layers.py\", line 94, in __call__\n    return super().__call__(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 234, in forward\n    hidden_states, _ = self.self_attn(\n                       ^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 169, in forward\n    attn_output, attn_weights = attention_interface(\n                                ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 109, in eager_attention_forward\n    attn_weights = torch.matmul(query, key_states.transpose(2, 3)) * scaling\n                   ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\nRuntimeError: CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\n",
    "method": "sync_curriculum",
    "seed": 456
  },
  {
    "error": "CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\nTraceback (most recent call last):\n  File \"/home/ray/default/scripts/run_qwen1.5b_distributed.py\", line 222, in train\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 963, in train\n    experiences = self._collect_experiences_local(\n                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 776, in _collect_experiences_local\n    outputs = self.model.generate(\n              ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/peft/peft_model.py\", line 2048, in generate\n    outputs = self.base_model.generate(*args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/utils/_contextlib.py\", line 124, in decorate_context\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2566, in generate\n    result = decoding_method(\n             ^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2786, in _sample\n    outputs = self(**model_inputs, return_dict=True)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 918, in wrapper\n    output = func(self, *args, **kwargs)\n             ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 449, in forward\n    outputs: BaseModelOutputWithPast = self.model(\n                                       ^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 1072, in wrapper\n    outputs = func(self, *args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 384, in forward\n    hidden_states = decoder_layer(\n                    ^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/modeling_layers.py\", line 94, in __call__\n    return super().__call__(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 234, in forward\n    hidden_states, _ = self.self_attn(\n                       ^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 169, in forward\n    attn_output, attn_weights = attention_interface(\n                                ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 109, in eager_attention_forward\n    attn_weights = torch.matmul(query, key_states.transpose(2, 3)) * scaling\n                   ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\nRuntimeError: CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\n",
    "method": "async",
    "seed": 42
  },
  {
    "error": "CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\nTraceback (most recent call last):\n  File \"/home/ray/default/scripts/run_qwen1.5b_distributed.py\", line 222, in train\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 963, in train\n    experiences = self._collect_experiences_local(\n                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 776, in _collect_experiences_local\n    outputs = self.model.generate(\n              ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/peft/peft_model.py\", line 2048, in generate\n    outputs = self.base_model.generate(*args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/utils/_contextlib.py\", line 124, in decorate_context\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2566, in generate\n    result = decoding_method(\n             ^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2786, in _sample\n    outputs = self(**model_inputs, return_dict=True)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 918, in wrapper\n    output = func(self, *args, **kwargs)\n             ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 449, in forward\n    outputs: BaseModelOutputWithPast = self.model(\n                                       ^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 1072, in wrapper\n    outputs = func(self, *args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 384, in forward\n    hidden_states = decoder_layer(\n                    ^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/modeling_layers.py\", line 94, in __call__\n    return super().__call__(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 234, in forward\n    hidden_states, _ = self.self_attn(\n                       ^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 169, in forward\n    attn_output, attn_weights = attention_interface(\n                                ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 109, in eager_attention_forward\n    attn_weights = torch.matmul(query, key_states.transpose(2, 3)) * scaling\n                   ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\nRuntimeError: CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\n",
    "method": "async",
    "seed": 123
  },
  {
    "error": "CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\nTraceback (most recent call last):\n  File \"/home/ray/default/scripts/run_qwen1.5b_distributed.py\", line 222, in train\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 963, in train\n    experiences = self._collect_experiences_local(\n                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 776, in _collect_experiences_local\n    outputs = self.model.generate(\n              ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/peft/peft_model.py\", line 2048, in generate\n    outputs = self.base_model.generate(*args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/utils/_contextlib.py\", line 124, in decorate_context\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2566, in generate\n    result = decoding_method(\n             ^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2786, in _sample\n    outputs = self(**model_inputs, return_dict=True)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 918, in wrapper\n    output = func(self, *args, **kwargs)\n             ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 449, in forward\n    outputs: BaseModelOutputWithPast = self.model(\n                                       ^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 1072, in wrapper\n    outputs = func(self, *args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 384, in forward\n    hidden_states = decoder_layer(\n                    ^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/modeling_layers.py\", line 94, in __call__\n    return super().__call__(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 234, in forward\n    hidden_states, _ = self.self_attn(\n                       ^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 169, in forward\n    attn_output, attn_weights = attention_interface(\n                                ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 109, in eager_attention_forward\n    attn_weights = torch.matmul(query, key_states.transpose(2, 3)) * scaling\n                   ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\nRuntimeError: CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\n",
    "method": "async",
    "seed": 456
  },
  {
    "error": "CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\nTraceback (most recent call last):\n  File \"/home/ray/default/scripts/run_qwen1.5b_distributed.py\", line 222, in train\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 963, in train\n    experiences = self._collect_experiences_local(\n                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 776, in _collect_experiences_local\n    outputs = self.model.generate(\n              ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/peft/peft_model.py\", line 2048, in generate\n    outputs = self.base_model.generate(*args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/utils/_contextlib.py\", line 124, in decorate_context\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2566, in generate\n    result = decoding_method(\n             ^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2786, in _sample\n    outputs = self(**model_inputs, return_dict=True)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 918, in wrapper\n    output = func(self, *args, **kwargs)\n             ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 449, in forward\n    outputs: BaseModelOutputWithPast = self.model(\n                                       ^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 1072, in wrapper\n    outputs = func(self, *args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 384, in forward\n    hidden_states = decoder_layer(\n                    ^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/modeling_layers.py\", line 94, in __call__\n    return super().__call__(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 234, in forward\n    hidden_states, _ = self.self_attn(\n                       ^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 169, in forward\n    attn_output, attn_weights = attention_interface(\n                                ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 109, in eager_attention_forward\n    attn_weights = torch.matmul(query, key_states.transpose(2, 3)) * scaling\n                   ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\nRuntimeError: CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\n",
    "method": "aceas",
    "seed": 42
  },
  {
    "error": "CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\nTraceback (most recent call last):\n  File \"/home/ray/default/scripts/run_qwen1.5b_distributed.py\", line 222, in train\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 963, in train\n    experiences = self._collect_experiences_local(\n                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 776, in _collect_experiences_local\n    outputs = self.model.generate(\n              ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/peft/peft_model.py\", line 2048, in generate\n    outputs = self.base_model.generate(*args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/utils/_contextlib.py\", line 124, in decorate_context\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2566, in generate\n    result = decoding_method(\n             ^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2786, in _sample\n    outputs = self(**model_inputs, return_dict=True)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 918, in wrapper\n    output = func(self, *args, **kwargs)\n             ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 449, in forward\n    outputs: BaseModelOutputWithPast = self.model(\n                                       ^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 1072, in wrapper\n    outputs = func(self, *args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 384, in forward\n    hidden_states = decoder_layer(\n                    ^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/modeling_layers.py\", line 94, in __call__\n    return super().__call__(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 234, in forward\n    hidden_states, _ = self.self_attn(\n                       ^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 169, in forward\n    attn_output, attn_weights = attention_interface(\n                                ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 109, in eager_attention_forward\n    attn_weights = torch.matmul(query, key_states.transpose(2, 3)) * scaling\n                   ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\nRuntimeError: CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\n",
    "method": "aceas",
    "seed": 123
  },
  {
    "error": "CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\nTraceback (most recent call last):\n  File \"/home/ray/default/scripts/run_qwen1.5b_distributed.py\", line 222, in train\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 963, in train\n    experiences = self._collect_experiences_local(\n                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/working_dir_files/_ray_pkg_ad69431a81f9ddae/src/training/aceas_trainer.py\", line 776, in _collect_experiences_local\n    outputs = self.model.generate(\n              ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/peft/peft_model.py\", line 2048, in generate\n    outputs = self.base_model.generate(*args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/utils/_contextlib.py\", line 124, in decorate_context\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2566, in generate\n    result = decoding_method(\n             ^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/generation/utils.py\", line 2786, in _sample\n    outputs = self(**model_inputs, return_dict=True)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 918, in wrapper\n    output = func(self, *args, **kwargs)\n             ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 449, in forward\n    outputs: BaseModelOutputWithPast = self.model(\n                                       ^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/generic.py\", line 1072, in wrapper\n    outputs = func(self, *args, **kwargs)\n              ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 384, in forward\n    hidden_states = decoder_layer(\n                    ^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/modeling_layers.py\", line 94, in __call__\n    return super().__call__(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 234, in forward\n    hidden_states, _ = self.self_attn(\n                       ^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1776, in _wrapped_call_impl\n    return self._call_impl(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/torch/nn/modules/module.py\", line 1787, in _call_impl\n    return forward_call(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/utils/deprecation.py\", line 172, in wrapped_func\n    return func(*args, **kwargs)\n           ^^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 169, in forward\n    attn_output, attn_weights = attention_interface(\n                                ^^^^^^^^^^^^^^^^^^^^\n  File \"/tmp/ray/session_2026-01-22_19-09-29_532237_2347/runtime_resources/pip/4ee19aa123619f754b42ef080d54bda2d9439af3/virtualenv/lib/python3.12/site-packages/transformers/models/qwen2/modeling_qwen2.py\", line 109, in eager_attention_forward\n    attn_weights = torch.matmul(query, key_states.transpose(2, 3)) * scaling\n                   ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\nRuntimeError: CUDA error: CUBLAS_STATUS_INVALID_VALUE when calling `cublasSgemmStridedBatched( handle, opa, opb, m, n, k, &alpha, a, lda, stridea, b, ldb, strideb, &beta, c, ldc, stridec, num_batches)`\n",
    "method": "aceas",
    "seed": 456
  }
]