Skip to content

Commit 67e8092

Browse files
committed
support qwen-3.5
1 parent edabb22 commit 67e8092

5 files changed

Lines changed: 16 additions & 16 deletions

File tree

ajet/default_config/ajet_default.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -28,7 +28,7 @@ class AjetData:
2828
@dataclass
2929
class AjetRollout:
3030
user_workflow: str = "tutorial.example_appworld.appworld->ExampleAgentScopeWorkflow"
31-
n_vllm_engine: int = 1
31+
n_vllm_engine: int = 1 # this argument only takes effect when using trinity
3232
tensor_model_parallel_size: int = 1
3333
num_repeat: int = 8
3434

ajet/default_config/verl/verl_default.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -166,7 +166,7 @@ actor_rollout_ref:
166166
use_torch_compile: ${oc.select:actor_rollout_ref.actor.use_torch_compile,true}
167167
log_prob_micro_batch_size: null
168168
log_prob_micro_batch_size_per_gpu: null
169-
log_prob_use_dynamic_bsz: ${oc.select:actor_rollout_ref.actor.use_dynamic_bsz,false}
169+
log_prob_use_dynamic_bsz: true
170170
log_prob_max_token_len_per_gpu: ${oc.select:actor_rollout_ref.actor.ppo_max_token_len_per_gpu,16384}
171171
profiler:
172172
_target_: verl.utils.profiler.ProfilerConfig
@@ -248,7 +248,7 @@ actor_rollout_ref:
248248
dtype: bfloat16
249249
gpu_memory_utilization: 0.80
250250
ignore_eos: false
251-
enforce_eager: false
251+
enforce_eager: true
252252
cudagraph_capture_sizes: null
253253
free_cache_engine: true
254254
tensor_model_parallel_size: 1
@@ -265,7 +265,7 @@ actor_rollout_ref:
265265
load_format: dummy
266266
log_prob_micro_batch_size: null
267267
log_prob_micro_batch_size_per_gpu: 1
268-
log_prob_use_dynamic_bsz: ${oc.select:actor_rollout_ref.actor.use_dynamic_bsz,false}
268+
log_prob_use_dynamic_bsz: true
269269
log_prob_max_token_len_per_gpu: ${oc.select:actor_rollout_ref.actor.ppo_max_token_len_per_gpu,16384}
270270
disable_log_stats: true
271271
do_sample: true
@@ -508,7 +508,7 @@ critic:
508508
ppo_mini_batch_size: ${oc.select:actor_rollout_ref.actor.ppo_mini_batch_size,256}
509509
ppo_micro_batch_size: null
510510
ppo_micro_batch_size_per_gpu: ${oc.select:.ppo_micro_batch_size,null}
511-
use_dynamic_bsz: ${oc.select:actor_rollout_ref.actor.use_dynamic_bsz,false}
511+
use_dynamic_bsz: true
512512
ppo_max_token_len_per_gpu: 32768
513513
forward_max_token_len_per_gpu: ${.ppo_max_token_len_per_gpu}
514514
ppo_epochs: ${oc.select:actor_rollout_ref.actor.ppo_epochs,1}

ajet/task_runner/base_runner.py

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -82,12 +82,12 @@ async def wrapper_type_asyncio(self, workflow_cls: Type[Workflow], workflow_task
8282
# malloc garbage collection
8383
del user_workflow
8484

85-
# run gc in a thread-safe way
86-
if gc_lock.acquire(blocking=False):
87-
try:
88-
gc.collect()
89-
finally:
90-
gc_lock.release()
85+
# # run gc in a thread-safe way
86+
# if gc_lock.acquire(blocking=False):
87+
# try:
88+
# gc.collect()
89+
# finally:
90+
# gc_lock.release()
9191
return result
9292

9393

scripts/download_model.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -4,9 +4,9 @@
44
from loguru import logger
55
from modelscope import snapshot_download
66

7-
cache_dir = input("model path (./modelscope_cache): ").strip()
7+
cache_dir = input("model path (/mnt/data_cpfs/model_cache/modelscope/hub/Qwen): ").strip()
88
if not cache_dir:
9-
cache_dir = "./modelscope_cache"
9+
cache_dir = "/mnt/data_cpfs/model_cache/modelscope/hub/Qwen"
1010
res = snapshot_download(input("model name: ").strip(), cache_dir=cache_dir)
1111
logger.success(res)
1212

tests/bench/benchmark_math/benchmark_math.yaml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,8 @@ ajet:
1414

1515
model:
1616
# ✨✨✨✨ 设置待训练的模型
17-
path: /mnt/data_cpfs/model_cache/modelscope/hub/Qwen/Qwen/Qwen2___5-7B-Instruct
17+
# path: /mnt/data_cpfs/model_cache/modelscope/hub/Qwen/Qwen/Qwen2___5-7B-Instruct
18+
path: /mnt/data_cpfs/model_cache/modelscope/hub/Qwen/Qwen/Qwen3.5-9B
1819

1920
rollout:
2021
user_workflow: "tutorial.example_math_agent.math_agent->ExampleMathLearn" # ✨✨✨✨ 编写并选择Agent
@@ -31,7 +32,6 @@ ajet:
3132
- "wrong_toolcall"
3233
max_response_length_in_one_turn: 1024
3334
max_model_len: 10000
34-
n_vllm_engine: 2
3535

3636
data:
3737
train_batch_size: 100
@@ -48,7 +48,7 @@ ajet:
4848
total_epochs: 100
4949
logger: swanlab
5050
nnodes: 1
51-
n_gpus_per_node: 4
51+
n_gpus_per_node: 8
5252

5353

5454

0 commit comments

Comments
 (0)