@@ -277,6 +277,193 @@ case:
277277 runtime_info/text_tokens : 0
278278 timeout : 1080
279279
280+ qwen3-sft-cache :
281+ -
282+ type : sft
283+ parameters :
284+ config : autotest/config/qwen3_sft_cache.py
285+ output_path : /mnt/shared-storage-user/llmrazor-share/qa-llm-cicd/test_output
286+ resource :
287+ cpus_per_task : 80
288+ envs :
289+ - QWEN3_MOE_PATH=/mnt/shared-storage-user/llmrazor-share/model/Qwen3-30B-A3B
290+ - ALPACA_PATH=/mnt/shared-storage-user/llmrazor-share/data/alpaca
291+ - CACHE_DIR=/mnt/shared-storage-user/llmrazor-share/qa-llm-cicd/.cache
292+ - XTUNER_DETERMINISTIC=true
293+ assert_info :
294+ base_metric : qwen3-sft-cache/e968368a/tracker.jsonl
295+ check_metrics :
296+ grad_norm : 0.000001
297+ loss/reduced_llm_loss : 0.000001
298+ lr : 0
299+ memory/max_memory_GB : 0.2
300+ runtime_info/tgs : 0.05
301+ runtime_info/text_tokens : 0
302+ timeout : 10800
303+
304+ qwen3-sft-vl-dense :
305+ -
306+ type : sft
307+ parameters :
308+ config : autotest/config/qwen3_vl_8B_dense.py
309+ output_path : /mnt/shared-storage-user/llmrazor-share/qa-llm-cicd/test_output
310+ resource :
311+ envs :
312+ - MODEL_PATH=/mnt/shared-storage-user/llmrazor-share/model/Qwen3-VL-8B-Instruct
313+ - DATA_PATH=/mnt/shared-storage-user/llmrazor-share/data/ci_vl
314+ - MEDIA_ROOT=/mnt/shared-storage-user/llmrazor-share/data/ci_vl
315+ - XTUNER_DETERMINISTIC=true
316+ assert_info :
317+ base_metric : qwen3-sft-vl-dense/812c1021/tracker.jsonl
318+ check_metrics :
319+ grad_norm : 0.000001
320+ loss/reduced_llm_loss : 0.000001
321+ lr : 0
322+ memory/max_memory_GB : 0.2
323+ runtime_info/tgs : 0.05
324+ runtime_info/text_tokens : 0
325+ timeout : 10800
326+
327+ qwen3-5-sft-vl-moe :
328+ -
329+ type : sft
330+ parameters :
331+ config : autotest/config/qwen3_5_35B_sft_vl.py
332+ output_path : /mnt/shared-storage-user/llmrazor-share/qa-llm-cicd/test_output
333+ resource :
334+ cpus_per_task : 80
335+ envs :
336+ - MODEL_PATH=/mnt/shared-storage-user/llmrazor-share/model/Qwen3.5-35B-A3B
337+ - DATA_PATH=/mnt/shared-storage-user/llmrazor-share/data/ci_vl
338+ - MEDIA_ROOT=/mnt/shared-storage-user/llmrazor-share/data/ci_vl
339+ - XTUNER_DETERMINISTIC=true
340+ assert_info :
341+ base_metric : qwen3-5-sft-vl-moe/e968368a/tracker.jsonl
342+ check_metrics :
343+ grad_norm : 5
344+ loss/reduced_llm_loss : 5
345+ lr : 0
346+ memory/max_memory_GB : 0.2
347+ runtime_info/tgs : 0.05
348+ runtime_info/text_tokens : 0
349+ timeout : 10800
350+
351+ qwen3-5-sft-fp8 :
352+ -
353+ type : sft
354+ parameters :
355+ config : autotest/config/qwen3_5_fp8.py
356+ output_path : /mnt/shared-storage-user/llmrazor-share/qa-llm-cicd/test_output
357+ resource :
358+ num_nodes : 1
359+ cpus_per_task : 80
360+ envs :
361+ - QWEN3_MOE_PATH=/mnt/shared-storage-user/llmrazor-share/model/Qwen3.5-35B-A3B
362+ - ALPACA_PATH=/mnt/shared-storage-user/llmrazor-share/data/alpaca
363+ - XTUNER_DETERMINISTIC=true
364+ - XTUNER_ACTIVATION_OFFLOAD=1
365+ - XTUNER_USE_FA3=1
366+ assert_info :
367+ base_metric : qwen3-5-sft-fp8/625c0018/tracker.jsonl
368+ check_metrics :
369+ grad_norm : 0.1
370+ loss/reduced_llm_loss : 0.000001
371+ lr : 0
372+ memory/max_memory_GB : 0.2
373+ runtime_info/tgs : 0.05
374+ runtime_info/text_tokens : 0
375+ timeout : 10800
376+
377+ qwen3-5-sft-recompute :
378+ -
379+ type : sft
380+ parameters :
381+ config : autotest/config/qwen3_5_recompute.py
382+ output_path : /mnt/shared-storage-user/llmrazor-share/qa-llm-cicd/test_output
383+ resource :
384+ num_nodes : 2
385+ cpus_per_task : 80
386+ envs :
387+ - QWEN3_MOE_PATH=/mnt/shared-storage-user/llmrazor-share/model/Qwen3.5-35B-A3B
388+ - ALPACA_PATH=/mnt/shared-storage-user/llmrazor-share/data/alpaca
389+ - XTUNER_DETERMINISTIC=true
390+ assert_info :
391+ base_metric : qwen3-5-sft-recompute/625c0018/tracker.jsonl
392+ check_metrics :
393+ grad_norm : 0.000001
394+ loss/reduced_llm_loss : 0.000001
395+ lr : 0
396+ memory/max_memory_GB : 0.2
397+ runtime_info/tgs : 0.05
398+ runtime_info/text_tokens : 0
399+ timeout : 10800
400+
401+ qwen3-5-sft-tp2 :
402+ -
403+ type : sft
404+ parameters :
405+ config : autotest/config/qwen3_5_moe_30BA3_tp2.py
406+ output_path : /mnt/shared-storage-user/llmrazor-share/qa-llm-cicd/test_output
407+ resource :
408+ envs :
409+ - QWEN3_MOE_PATH=/mnt/shared-storage-user/llmrazor-share/model/Qwen3.5-35B-A3B
410+ - ALPACA_PATH=/mnt/shared-storage-user/llmrazor-share/data/alpaca
411+ - XTUNER_DETERMINISTIC=true
412+ assert_info :
413+ base_metric : qwen3-5-sft-tp2/625c0018/tracker.jsonl
414+ check_metrics :
415+ grad_norm : 0.05
416+ loss/reduced_llm_loss : 0.000001
417+ lr : 0
418+ memory/max_memory_GB : 0.2
419+ runtime_info/tgs : 0.05
420+ runtime_info/text_tokens : 0
421+ timeout : 10800
422+
423+ qwen3-5-sft-sp4-resume :
424+ -
425+ type : sft
426+ parameters :
427+ config : autotest/config/qwen3_5_moe_30BA3_sp4.py
428+ output_path : /mnt/shared-storage-user/llmrazor-share/qa-llm-cicd/test_output
429+ resource :
430+ envs :
431+ - QWEN3_MOE_PATH=/mnt/shared-storage-user/llmrazor-share/model/Qwen3.5-35B-A3B
432+ - ALPACA_PATH=/mnt/shared-storage-user/llmrazor-share/data/ci_resume
433+ - XTUNER_DETERMINISTIC=true
434+ assert_info :
435+ base_metric : qwen3-5-sft-sp4-resume/625c0018/tracker.jsonl
436+ check_metrics :
437+ grad_norm : 0.02
438+ loss/reduced_llm_loss : 0.000001
439+ lr : 0
440+ memory/max_memory_GB : 0.2
441+ runtime_info/tgs : 0.05
442+ runtime_info/text_tokens : 0
443+ timeout : 10800
444+
445+ -
446+ type : sft
447+ parameters :
448+ config : autotest/config/qwen3_5_moe_30BA3_sp4.py
449+ output_path : /mnt/shared-storage-user/llmrazor-share/qa-llm-cicd/test_output
450+ resource :
451+ memory_per_task : 1200
452+ envs :
453+ - QWEN3_MOE_PATH=/mnt/shared-storage-user/llmrazor-share/model/Qwen3.5-35B-A3B
454+ - ALPACA_PATH=/mnt/shared-storage-user/llmrazor-share/data/alpaca
455+ - XTUNER_DETERMINISTIC=true
456+ assert_info :
457+ base_metric : qwen3-5-sft-sp4-resume/625c0018_resume/tracker.jsonl
458+ check_metrics :
459+ grad_norm : 0.02
460+ loss/reduced_llm_loss : 0.000001
461+ lr : 0
462+ memory/max_memory_GB : 0.2
463+ runtime_info/tgs : 0.05
464+ runtime_info/text_tokens : 0
465+ timeout : 10800
466+
280467 qwen3-rl-lmdeploy :
281468 -
282469 type : rl
@@ -319,3 +506,47 @@ case:
319506 method : absolute
320507 operator : <
321508 timeout : 2460
509+
510+ qwen3-rl-vl-lmdeploy :
511+ -
512+ type : rl
513+ parameters :
514+ config : autotest/config/rl_qwen3_vl_geometry3k_grpo.py
515+ infer_backend : lmdeploy
516+ output_path : /mnt/shared-storage-user/llmrazor-share/qa-llm-cicd/test_output
517+ resource :
518+ envs :
519+ - MODEL_PATH=/mnt/shared-storage-user/llmrazor-share/model/Qwen3-VL-8B-Instruct
520+ - DATA_PATH=/mnt/shared-storage-user/llmrazor-share/data/less_geometry3k/train.jsonl
521+ - EVAL_DATA_PATH=/mnt/shared-storage-user/llmrazor-share/data/less_geometry3k/test.jsonl
522+ - MEDIA_ROOT=/mnt/shared-storage-user/llmrazor-share/data/less_geometry3k
523+ - XTUNER_DETERMINISTIC=true
524+ assert_info :
525+ base_metric : qwen3-rl-vl-lmdeploy/fb28789f/tracker.jsonl
526+ check_metrics :
527+ -
528+ metric : eval/accuracy
529+ threshold : 0.1
530+ method : absolute
531+ operator : <
532+ -
533+ metric : response/rewards/mean
534+ threshold : 0.1
535+ method : absolute
536+ operator : <
537+ -
538+ metric : mismatch/mismatch_k3_kl
539+ threshold : 0.0001
540+ method : absolute
541+ operator : <=
542+ -
543+ metric : response/response_len/mean
544+ threshold : 0.12
545+ method : relative
546+ operator : <
547+ -
548+ metric : time/step
549+ threshold : 10
550+ method : absolute
551+ operator : <
552+ timeout : 4200
0 commit comments