mirror of
https://github.com/volcengine/verl.git
synced 2025-10-20 13:43:50 +08:00
Commit Graph
Select branches
Hide Pull Requests
dependabot/pip/sglang-all--0.5.3.post1
dependabot/pip/torchvision-0.23.0
main
recipe/dapo
recipe/entropy-mechanism
recipe/one_step_off_async
revert-3769-fix-async-reward
v0.2.x
v0.3.x
v0.4.1.x
v0.4.x
v0.5.x
v0.6.x
wuxibin/fix_agent_loop
wuxibin/rollout_mode
#1
#100
#1001
#1005
#1006
#1006
#1007
#1009
#1010
#1012
#1016
#1018
#102
#1020
#1020
#1021
#1021
#1024
#1025
#1026
#1027
#1029
#103
#1030
#1032
#1034
#1035
#1037
#1038
#1040
#1040
#1041
#1042
#1044
#1044
#1045
#1046
#1047
#1048
#105
#1050
#1052
#1052
#1053
#1054
#1055
#1060
#1064
#1068
#1069
#107
#1071
#1072
#1073
#1074
#1075
#1078
#1081
#1082
#1085
#1086
#1087
#1088
#109
#1090
#1091
#1092
#1092
#1095
#1095
#1098
#1099
#110
#1100
#1101
#1103
#1104
#1105
#1107
#111
#1111
#1112
#1113
#1114
#1116
#1117
#1118
#112
#1123
#1123
#1124
#1124
#1125
#1127
#1128
#1128
#113
#1131
#1132
#1135
#1136
#1137
#1138
#1139
#114
#1140
#1143
#1146
#115
#1152
#1152
#1153
#1153
#1154
#1155
#1157
#1159
#116
#1160
#1161
#1162
#1164
#1168
#117
#1171
#1173
#1174
#1175
#1177
#1178
#1179
#118
#1180
#1181
#1184
#1185
#1186
#1190
#1195
#1198
#1199
#120
#1200
#1202
#1203
#1204
#1205
#1206
#1206
#1207
#121
#1211
#1212
#1215
#1217
#1219
#122
#1220
#1222
#1223
#1225
#1225
#1227
#1228
#1229
#123
#1230
#1231
#1231
#1234
#1234
#1236
#1237
#124
#1240
#1241
#1245
#1247
#1248
#125
#1250
#1252
#1253
#1254
#1256
#1258
#1259
#126
#1260
#1261
#1261
#1265
#1266
#1267
#1269
#127
#1271
#1272
#1274
#1275
#1276
#1277
#1278
#1279
#1279
#128
#1280
#1281
#1282
#1283
#1284
#1286
#1287
#1288
#1289
#129
#1290
#1292
#1294
#1295
#1295
#1296
#1296
#1297
#130
#1300
#1301
#1301
#1312
#1316
#1318
#1319
#1319
#132
#1320
#1323
#1324
#1325
#1327
#133
#1331
#1333
#1336
#1337
#1339
#1340
#1342
#1342
#1343
#1347
#1349
#1349
#135
#1350
#1351
#1353
#1355
#1356
#1358
#1358
#136
#1362
#1364
#1366
#1369
#137
#1370
#1372
#1373
#1374
#1378
#1379
#1385
#1387
#1389
#139
#1390
#1391
#1392
#1395
#1396
#1397
#140
#1400
#1401
#1404
#1405
#1406
#1407
#1408
#1409
#141
#1411
#1413
#1415
#1419
#142
#1421
#1423
#1424
#1429
#1432
#1433
#1434
#1435
#1437
#1439
#1440
#1441
#1442
#1443
#1444
#1445
#1449
#1450
#1451
#1453
#1454
#146
#1460
#1461
#1463
#1464
#1465
#1466
#1467
#1468
#147
#1470
#1475
#1479
#1480
#1482
#1483
#1488
#1489
#1489
#1490
#1490
#1491
#1494
#1495
#1497
#1499
#150
#1505
#1509
#1513
#1514
#1519
#1519
#152
#1520
#1522
#1523
#1525
#1527
#1529
#153
#1532
#1533
#1536
#1538
#1539
#1540
#1541
#1541
#1544
#1547
#1548
#1548
#1549
#1551
#1552
#1553
#1555
#1557
#1557
#1558
#1559
#156
#1562
#1564
#1566
#1567
#1568
#1571
#1577
#1582
#1583
#1585
#1586
#1587
#1588
#1591
#1592
#1593
#1594
#1596
#1597
#1598
#1600
#1601
#1602
#1604
#1606
#1607
#1608
#1609
#1610
#1612
#1613
#1616
#1617
#162
#1621
#1622
#1623
#1624
#1625
#1627
#1629
#163
#1630
#1631
#1634
#1637
#1638
#1639
#164
#1641
#1647
#1648
#165
#1650
#1651
#1652
#1653
#166
#1660
#1665
#1666
#1667
#1668
#1669
#167
#1670
#1671
#1672
#1673
#1678
#1681
#1682
#1685
#1686
#1686
#1687
#1688
#1689
#1690
#1693
#1693
#1694
#1697
#1698
#17
#1700
#1701
#1702
#1704
#1705
#1706
#1707
#1709
#1712
#1713
#1714
#1715
#1717
#1719
#1726
#1728
#1729
#173
#1730
#1731
#1732
#1737
#1738
#1739
#174
#1740
#1741
#1742
#1743
#1744
#1745
#1748
#1749
#175
#1750
#1753
#1754
#1754
#1755
#1756
#1760
#1761
#1762
#1763
#1765
#1766
#1767
#1768
#1769
#177
#1770
#1771
#1772
#1773
#1774
#1775
#1776
#1779
#178
#1781
#1786
#1786
#1787
#1788
#179
#1791
#1792
#1794
#1796
#1797
#1799
#18
#1805
#1806
#1807
#1808
#1809
#1810
#1811
#1812
#1813
#1814
#1816
#1817
#1818
#1819
#182
#1820
#1821
#1822
#1823
#1826
#1828
#1829
#183
#1830
#1831
#1832
#1833
#1834
#1835
#1835
#1836
#1838
#1839
#1840
#1841
#1843
#1844
#1846
#1847
#185
#1850
#1851
#1852
#1854
#1855
#1856
#1856
#1858
#1859
#186
#1861
#1862
#1866
#1867
#1868
#187
#1870
#1871
#1871
#1872
#1877
#1878
#1879
#1880
#1884
#1886
#1888
#1889
#1890
#1891
#1893
#1896
#1897
#1898
#1899
#19
#1900
#1901
#1904
#1905
#1906
#1907
#1908
#1909
#191
#1910
#1911
#1912
#1913
#1914
#1916
#1917
#1918
#192
#1920
#1922
#1924
#1925
#1927
#193
#1930
#1932
#1933
#1935
#194
#1942
#1943
#1944
#1945
#1946
#1947
#1948
#1949
#195
#1950
#1952
#1953
#1953
#1954
#1955
#1956
#1957
#1958
#1959
#196
#1961
#1965
#1968
#1969
#1971
#1971
#1972
#1974
#1977
#1979
#198
#198
#1981
#1983
#1985
#1987
#199
#1990
#1991
#1994
#1995
#1996
#1998
#1999
#2
#200
#2000
#2002
#2003
#2003
#2004
#2006
#2007
#2008
#201
#2010
#2014
#2016
#2017
#2018
#2019
#202
#2021
#2021
#2023
#2025
#2026
#2028
#2029
#203
#2033
#2035
#2036
#2037
#2039
#204
#2043
#2045
#2046
#2049
#205
#2050
#2051
#2052
#2053
#2054
#2056
#2056
#2057
#206
#2062
#2063
#2064
#2067
#2068
#207
#2070
#2071
#2071
#2072
#2074
#2075
#2075
#2076
#2076
#2077
#208
#2080
#2081
#2083
#2084
#2085
#2089
#209
#2090
#2091
#2092
#2094
#2097
#2097
#2098
#210
#2100
#2100
#2101
#2102
#2103
#2104
#2105
#2107
#2109
#2111
#2113
#2114
#2116
#2117
#2118
#2120
#2120
#2121
#2122
#2123
#2124
#2125
#2126
#2127
#213
#2130
#2131
#2132
#2132
#2135
#2135
#2137
#2138
#2139
#2139
#2141
#2142
#2142
#2143
#2144
#2144
#2146
#2147
#215
#2154
#2156
#2158
#2158
#216
#2161
#2162
#2163
#2164
#2169
#2170
#2172
#2173
#2173
#2174
#2176
#2178
#218
#2180
#2182
#2183
#2183
#2184
#2187
#219
#2190
#2191
#2192
#2194
#2199
#2199
#220
#2200
#2203
#2206
#2210
#2212
#2214
#2215
#2217
#2219
#2219
#222
#2220
#2220
#2224
#2226
#2227
#2229
#223
#2230
#2231
#2232
#2232
#2233
#2239
#2240
#2241
#2244
#2246
#2247
#2248
#2249
#225
#2251
#2253
#2255
#2256
#2257
#2258
#2259
#226
#2261
#2267
#2268
#2269
#2269
#2272
#2275
#228
#2281
#2284
#2287
#2288
#2289
#2290
#2291
#2292
#2293
#2295
#2297
#2297
#2298
#23
#230
#2303
#2307
#2308
#2308
#231
#2312
#2314
#2315
#2321
#2322
#2323
#2323
#2324
#2326
#2327
#2328
#2328
#233
#2330
#2331
#2332
#2334
#2334
#2335
#2336
#2337
#2338
#2338
#234
#2341
#2342
#2343
#2345
#2346
#2347
#2347
#2349
#235
#2350
#2352
#2353
#2354
#2358
#236
#2362
#2365
#2367
#2369
#237
#2370
#2371
#2372
#2374
#2375
#2376
#2377
#2378
#2379
#2381
#2381
#2382
#2383
#2385
#239
#2390
#2392
#2393
#2398
#240
#2400
#2403
#2404
#2407
#2409
#2410
#2412
#2418
#2421
#2428
#243
#2430
#2431
#2432
#2433
#2434
#2435
#2435
#2436
#2436
#2439
#244
#2440
#2442
#2444
#2444
#2446
#2446
#2451
#2452
#2454
#2454
#2455
#2456
#2459
#2460
#2461
#2462
#2463
#2465
#2466
#2466
#2467
#2468
#2469
#247
#247
#2470
#2472
#2472
#2473
#2474
#2475
#2475
#2476
#2477
#248
#2480
#2481
#2484
#2485
#2487
#2487
#2488
#2489
#2491
#2494
#2495
#2495
#2496
#2497
#2498
#2499
#2500
#2500
#2502
#2503
#2508
#2509
#2510
#2510
#2511
#2513
#2514
#2516
#2519
#2521
#2523
#2524
#2525
#2529
#2530
#2530
#2531
#2532
#2533
#2534
#2537
#254
#2541
#2542
#2543
#2545
#2548
#255
#2553
#2554
#2555
#2557
#2559
#256
#2560
#2561
#2563
#2567
#2568
#2569
#257
#2574
#2576
#2577
#258
#2580
#2582
#2583
#2585
#2587
#259
#2590
#2591
#2595
#2598
#260
#2602
#2604
#2605
#2605
#2606
#2607
#261
#2610
#2611
#2614
#2615
#2615
#2617
#2619
#262
#2620
#2621
#2622
#2623
#2623
#2624
#2629
#2629
#2630
#2632
#2634
#2635
#2636
#2637
#264
#2641
#2641
#2645
#2646
#2647
#2649
#2651
#2659
#266
#2664
#2665
#2666
#2667
#2668
#2669
#2670
#2671
#2672
#2675
#2676
#2678
#268
#2685
#2687
#2689
#2690
#2690
#2691
#2692
#2693
#2695
#2696
#2698
#2699
#27
#2700
#2701
#2707
#2709
#2711
#2714
#2715
#2716
#2717
#2718
#2719
#272
#2720
#2725
#2726
#2729
#2730
#2731
#2732
#2733
#2739
#274
#2740
#2741
#2745
#2746
#2747
#2748
#2748
#2749
#2750
#2754
#2757
#2759
#2761
#2762
#2763
#2764
#2765
#2768
#2771
#2772
#2773
#2774
#2774
#2775
#2777
#2782
#2784
#2786
#2787
#2788
#279
#2792
#2792
#2794
#2795
#2799
#2799
#28
#2800
#2805
#2806
#2808
#281
#2810
#2813
#2815
#2815
#2816
#2817
#2818
#282
#2821
#2823
#2824
#2827
#2831
#2835
#2835
#2836
#2838
#2839
#2839
#284
#2843
#2845
#2845
#2849
#2851
#2851
#2854
#2854
#2859
#286
#2861
#2861
#2864
#2866
#2868
#2869
#2870
#2871
#2874
#2875
#2875
#2878
#2878
#2880
#2881
#2882
#2883
#2884
#2885
#2887
#2888
#2888
#2893
#2894
#2895
#2896
#290
#2900
#2901
#2902
#2903
#2904
#2905
#2907
#2908
#291
#2912
#2915
#2915
#2924
#2925
#2926
#2927
#2929
#2931
#2933
#2936
#294
#2941
#2945
#2946
#2947
#2948
#2952
#2953
#2954
#2956
#2957
#2959
#2960
#2962
#2963
#2963
#2964
#2967
#2970
#2973
#2974
#2977
#2978
#2980
#2981
#2982
#2983
#2983
#2985
#2988
#2988
#2989
#2989
#299
#2990
#2990
#2993
#2998
#2999
#3
#30
#3000
#3001
#3004
#3006
#3007
#3009
#301
#3010
#3011
#3012
#3013
#3014
#3014
#3016
#3017
#3019
#3020
#3021
#3022
#3023
#3029
#303
#3031
#3034
#3036
#3037
#304
#3041
#3044
#3046
#3047
#3049
#305
#3051
#3052
#3053
#3054
#3055
#3059
#3060
#3063
#3066
#3068
#307
#3071
#3072
#3077
#3077
#3078
#308
#3082
#3083
#3084
#3084
#309
#3090
#3091
#3092
#3094
#3099
#31
#310
#3100
#3100
#3101
#3102
#3103
#3105
#3106
#3108
#3109
#3111
#3112
#3113
#3117
#3119
#3120
#3127
#3128
#313
#3131
#3132
#3133
#3134
#3135
#3136
#3138
#3139
#314
#3141
#3142
#3144
#3145
#3146
#3151
#3152
#3154
#3155
#3155
#3156
#3161
#3162
#3167
#3167
#3168
#3168
#317
#3171
#3174
#3175
#3177
#3178
#3179
#318
#3180
#3180
#3181
#3183
#3184
#3186
#3187
#3188
#3189
#3191
#3191
#3192
#3194
#3196
#3197
#3198
#32
#320
#3202
#3203
#3204
#3206
#3207
#3208
#3209
#321
#321
#3211
#3212
#3214
#3215
#3216
#3217
#3219
#322
#3221
#3222
#3224
#3225
#3227
#3228
#3229
#3229
#323
#3230
#3231
#3235
#3239
#3241
#3242
#3245
#3247
#3247
#325
#3251
#3252
#3259
#3259
#3260
#3261
#3268
#327
#3270
#3272
#3274
#3280
#3281
#3282
#3283
#3283
#3284
#3285
#3287
#3289
#329
#3291
#3294
#3294
#3295
#3297
#3297
#3298
#33
#330
#3300
#3301
#3303
#3304
#3306
#3307
#3309
#3310
#3312
#3313
#3314
#3315
#3317
#332
#3320
#3321
#3326
#3326
#3327
#3328
#333
#3330
#3331
#3332
#3333
#3336
#3341
#3343
#3344
#3345
#3347
#3348
#335
#3352
#3353
#3355
#3356
#3357
#3357
#3359
#3362
#3363
#3367
#3368
#3369
#3370
#3371
#3378
#3383
#3384
#3385
#3388
#3388
#3389
#3389
#339
#3390
#3394
#3395
#3397
#3397
#34
#3401
#3404
#3405
#3405
#3409
#341
#3410
#3411
#3414
#3417
#3422
#3423
#3425
#3427
#3427
#3429
#3429
#343
#3430
#3433
#3438
#3438
#3439
#3441
#3442
#3448
#3454
#3455
#3456
#3458
#346
#3460
#3460
#3461
#3465
#3465
#3467
#3467
#3471
#3472
#3473
#3475
#3475
#3479
#3479
#348
#3482
#3483
#3484
#3485
#3485
#3489
#3490
#3492
#3493
#3493
#3494
#3495
#3496
#3497
#3499
#35
#350
#3500
#3501
#3502
#3503
#3505
#3506
#3507
#3509
#351
#3511
#3513
#3514
#3519
#3519
#3520
#3522
#3522
#3523
#3523
#3524
#3526
#3527
#3528
#3529
#353
#3530
#3531
#3532
#3533
#3534
#3535
#3537
#3540
#3541
#3543
#3544
#3547
#3548
#3548
#3552
#3553
#3555
#3556
#3563
#3565
#3567
#357
#3570
#3571
#3572
#3573
#3574
#3576
#3577
#3578
#358
#3580
#3582
#3586
#3587
#3588
#3589
#359
#359
#3590
#3590
#3594
#3595
#3596
#3598
#3599
#36
#360
#3600
#3601
#3604
#3605
#3605
#3608
#361
#3610
#3610
#3611
#3613
#3614
#3616
#3617
#362
#3621
#3623
#3625
#3626
#3627
#3628
#3628
#363
#3630
#3631
#3635
#3637
#3637
#3639
#364
#364
#3640
#3641
#3644
#3648
#3649
#3649
#3651
#3651
#3653
#3655
#3656
#3656
#3657
#366
#3661
#3662
#3663
#3667
#3668
#3670
#3673
#3673
#3675
#3677
#3678
#3679
#3679
#368
#3681
#3682
#3682
#3684
#3685
#3686
#3687
#3688
#3689
#3690
#3690
#3691
#3691
#3692
#3694
#3698
#3699
#37
#370
#3700
#3701
#3702
#3703
#3705
#3706
#3710
#3710
#3712
#3713
#3713
#3716
#3718
#3722
#3724
#3724
#3725
#3726
#3728
#3728
#3729
#3729
#3732
#3734
#3735
#3736
#3738
#3739
#374
#3746
#3747
#3747
#3748
#3749
#3749
#3750
#3751
#3755
#3756
#3760
#3763
#3764
#3765
#3765
#3767
#3768
#3769
#377
#3770
#3771
#3772
#3773
#3774
#3777
#3778
#3779
#3780
#3781
#3782
#3786
#3789
#379
#3790
#3793
#3797
#3799
#38
#3803
#3804
#381
#3810
#3812
#3812
#3814
#3814
#3815
#3817
#3819
#382
#3820
#3821
#3824
#386
#389
#39
#391
#392
#396
#4
#402
#403
#404
#408
#409
#41
#416
#417
#419
#419
#423
#424
#425
#426
#427
#43
#432
#435
#436
#436
#437
#44
#440
#442
#443
#445
#448
#449
#45
#450
#451
#452
#454
#459
#461
#462
#463
#464
#465
#469
#47
#470
#474
#475
#476
#478
#480
#482
#483
#487
#489
#49
#490
#495
#497
#499
#50
#500
#504
#505
#506
#507
#508
#510
#511
#515
#515
#52
#520
#524
#527
#532
#534
#54
#541
#542
#543
#545
#547
#547
#549
#55
#551
#552
#553
#554
#556
#557
#558
#559
#56
#560
#561
#562
#563
#564
#565
#569
#57
#570
#575
#577
#58
#581
#583
#585
#586
#587
#588
#59
#590
#591
#592
#599
#60
#601
#601
#602
#603
#61
#610
#611
#612
#614
#615
#617
#618
#619
#620
#621
#622
#623
#624
#629
#63
#631
#634
#635
#639
#640
#641
#642
#644
#645
#646
#648
#65
#650
#652
#657
#662
#663
#664
#669
#67
#674
#675
#676
#677
#681
#683
#684
#686
#687
#688
#691
#694
#695
#7
#70
#704
#706
#71
#711
#712
#714
#715
#717
#718
#72
#722
#723
#724
#729
#732
#735
#736
#737
#738
#738
#74
#741
#743
#743
#745
#749
#75
#753
#754
#755
#756
#757
#757
#759
#759
#760
#761
#762
#763
#764
#765
#769
#772
#773
#776
#777
#780
#781
#782
#784
#786
#787
#788
#789
#79
#790
#792
#793
#794
#794
#797
#80
#800
#802
#808
#808
#809
#81
#810
#810
#811
#812
#812
#813
#814
#818
#819
#820
#822
#824
#826
#828
#829
#83
#832
#833
#838
#84
#840
#844
#845
#846
#85
#850
#851
#852
#853
#854
#857
#858
#86
#861
#865
#866
#867
#868
#869
#871
#872
#875
#878
#879
#88
#881
#882
#883
#884
#885
#886
#887
#889
#89
#890
#893
#894
#9
#90
#902
#906
#908
#909
#91
#910
#912
#915
#916
#917
#918
#92
#921
#922
#923
#924
#925
#927
#929
#930
#931
#934
#938
#94
#941
#942
#944
#945
#947
#948
#948
#951
#954
#955
#955
#956
#956
#958
#959
#960
#962
#963
#969
#970
#971
#972
#973
#973
#975
#976
#978
#979
#98
#982
#983
#984
#986
#987
#989
#99
#990
#996
#998
v0.1
v0.1rc
v0.2
v0.2.0.post1
v0.2.0.post2
v0.3.0.post0
v0.3.0.post1
v0.3.0.rc0
v0.4.0
v0.4.1
v0.5.0
v0.6.0
Select branches
Hide Pull Requests
dependabot/pip/sglang-all--0.5.3.post1
dependabot/pip/torchvision-0.23.0
main
recipe/dapo
recipe/entropy-mechanism
recipe/one_step_off_async
revert-3769-fix-async-reward
v0.2.x
v0.3.x
v0.4.1.x
v0.4.x
v0.5.x
v0.6.x
wuxibin/fix_agent_loop
wuxibin/rollout_mode
#1
#100
#1001
#1005
#1006
#1006
#1007
#1009
#1010
#1012
#1016
#1018
#102
#1020
#1020
#1021
#1021
#1024
#1025
#1026
#1027
#1029
#103
#1030
#1032
#1034
#1035
#1037
#1038
#1040
#1040
#1041
#1042
#1044
#1044
#1045
#1046
#1047
#1048
#105
#1050
#1052
#1052
#1053
#1054
#1055
#1060
#1064
#1068
#1069
#107
#1071
#1072
#1073
#1074
#1075
#1078
#1081
#1082
#1085
#1086
#1087
#1088
#109
#1090
#1091
#1092
#1092
#1095
#1095
#1098
#1099
#110
#1100
#1101
#1103
#1104
#1105
#1107
#111
#1111
#1112
#1113
#1114
#1116
#1117
#1118
#112
#1123
#1123
#1124
#1124
#1125
#1127
#1128
#1128
#113
#1131
#1132
#1135
#1136
#1137
#1138
#1139
#114
#1140
#1143
#1146
#115
#1152
#1152
#1153
#1153
#1154
#1155
#1157
#1159
#116
#1160
#1161
#1162
#1164
#1168
#117
#1171
#1173
#1174
#1175
#1177
#1178
#1179
#118
#1180
#1181
#1184
#1185
#1186
#1190
#1195
#1198
#1199
#120
#1200
#1202
#1203
#1204
#1205
#1206
#1206
#1207
#121
#1211
#1212
#1215
#1217
#1219
#122
#1220
#1222
#1223
#1225
#1225
#1227
#1228
#1229
#123
#1230
#1231
#1231
#1234
#1234
#1236
#1237
#124
#1240
#1241
#1245
#1247
#1248
#125
#1250
#1252
#1253
#1254
#1256
#1258
#1259
#126
#1260
#1261
#1261
#1265
#1266
#1267
#1269
#127
#1271
#1272
#1274
#1275
#1276
#1277
#1278
#1279
#1279
#128
#1280
#1281
#1282
#1283
#1284
#1286
#1287
#1288
#1289
#129
#1290
#1292
#1294
#1295
#1295
#1296
#1296
#1297
#130
#1300
#1301
#1301
#1312
#1316
#1318
#1319
#1319
#132
#1320
#1323
#1324
#1325
#1327
#133
#1331
#1333
#1336
#1337
#1339
#1340
#1342
#1342
#1343
#1347
#1349
#1349
#135
#1350
#1351
#1353
#1355
#1356
#1358
#1358
#136
#1362
#1364
#1366
#1369
#137
#1370
#1372
#1373
#1374
#1378
#1379
#1385
#1387
#1389
#139
#1390
#1391
#1392
#1395
#1396
#1397
#140
#1400
#1401
#1404
#1405
#1406
#1407
#1408
#1409
#141
#1411
#1413
#1415
#1419
#142
#1421
#1423
#1424
#1429
#1432
#1433
#1434
#1435
#1437
#1439
#1440
#1441
#1442
#1443
#1444
#1445
#1449
#1450
#1451
#1453
#1454
#146
#1460
#1461
#1463
#1464
#1465
#1466
#1467
#1468
#147
#1470
#1475
#1479
#1480
#1482
#1483
#1488
#1489
#1489
#1490
#1490
#1491
#1494
#1495
#1497
#1499
#150
#1505
#1509
#1513
#1514
#1519
#1519
#152
#1520
#1522
#1523
#1525
#1527
#1529
#153
#1532
#1533
#1536
#1538
#1539
#1540
#1541
#1541
#1544
#1547
#1548
#1548
#1549
#1551
#1552
#1553
#1555
#1557
#1557
#1558
#1559
#156
#1562
#1564
#1566
#1567
#1568
#1571
#1577
#1582
#1583
#1585
#1586
#1587
#1588
#1591
#1592
#1593
#1594
#1596
#1597
#1598
#1600
#1601
#1602
#1604
#1606
#1607
#1608
#1609
#1610
#1612
#1613
#1616
#1617
#162
#1621
#1622
#1623
#1624
#1625
#1627
#1629
#163
#1630
#1631
#1634
#1637
#1638
#1639
#164
#1641
#1647
#1648
#165
#1650
#1651
#1652
#1653
#166
#1660
#1665
#1666
#1667
#1668
#1669
#167
#1670
#1671
#1672
#1673
#1678
#1681
#1682
#1685
#1686
#1686
#1687
#1688
#1689
#1690
#1693
#1693
#1694
#1697
#1698
#17
#1700
#1701
#1702
#1704
#1705
#1706
#1707
#1709
#1712
#1713
#1714
#1715
#1717
#1719
#1726
#1728
#1729
#173
#1730
#1731
#1732
#1737
#1738
#1739
#174
#1740
#1741
#1742
#1743
#1744
#1745
#1748
#1749
#175
#1750
#1753
#1754
#1754
#1755
#1756
#1760
#1761
#1762
#1763
#1765
#1766
#1767
#1768
#1769
#177
#1770
#1771
#1772
#1773
#1774
#1775
#1776
#1779
#178
#1781
#1786
#1786
#1787
#1788
#179
#1791
#1792
#1794
#1796
#1797
#1799
#18
#1805
#1806
#1807
#1808
#1809
#1810
#1811
#1812
#1813
#1814
#1816
#1817
#1818
#1819
#182
#1820
#1821
#1822
#1823
#1826
#1828
#1829
#183
#1830
#1831
#1832
#1833
#1834
#1835
#1835
#1836
#1838
#1839
#1840
#1841
#1843
#1844
#1846
#1847
#185
#1850
#1851
#1852
#1854
#1855
#1856
#1856
#1858
#1859
#186
#1861
#1862
#1866
#1867
#1868
#187
#1870
#1871
#1871
#1872
#1877
#1878
#1879
#1880
#1884
#1886
#1888
#1889
#1890
#1891
#1893
#1896
#1897
#1898
#1899
#19
#1900
#1901
#1904
#1905
#1906
#1907
#1908
#1909
#191
#1910
#1911
#1912
#1913
#1914
#1916
#1917
#1918
#192
#1920
#1922
#1924
#1925
#1927
#193
#1930
#1932
#1933
#1935
#194
#1942
#1943
#1944
#1945
#1946
#1947
#1948
#1949
#195
#1950
#1952
#1953
#1953
#1954
#1955
#1956
#1957
#1958
#1959
#196
#1961
#1965
#1968
#1969
#1971
#1971
#1972
#1974
#1977
#1979
#198
#198
#1981
#1983
#1985
#1987
#199
#1990
#1991
#1994
#1995
#1996
#1998
#1999
#2
#200
#2000
#2002
#2003
#2003
#2004
#2006
#2007
#2008
#201
#2010
#2014
#2016
#2017
#2018
#2019
#202
#2021
#2021
#2023
#2025
#2026
#2028
#2029
#203
#2033
#2035
#2036
#2037
#2039
#204
#2043
#2045
#2046
#2049
#205
#2050
#2051
#2052
#2053
#2054
#2056
#2056
#2057
#206
#2062
#2063
#2064
#2067
#2068
#207
#2070
#2071
#2071
#2072
#2074
#2075
#2075
#2076
#2076
#2077
#208
#2080
#2081
#2083
#2084
#2085
#2089
#209
#2090
#2091
#2092
#2094
#2097
#2097
#2098
#210
#2100
#2100
#2101
#2102
#2103
#2104
#2105
#2107
#2109
#2111
#2113
#2114
#2116
#2117
#2118
#2120
#2120
#2121
#2122
#2123
#2124
#2125
#2126
#2127
#213
#2130
#2131
#2132
#2132
#2135
#2135
#2137
#2138
#2139
#2139
#2141
#2142
#2142
#2143
#2144
#2144
#2146
#2147
#215
#2154
#2156
#2158
#2158
#216
#2161
#2162
#2163
#2164
#2169
#2170
#2172
#2173
#2173
#2174
#2176
#2178
#218
#2180
#2182
#2183
#2183
#2184
#2187
#219
#2190
#2191
#2192
#2194
#2199
#2199
#220
#2200
#2203
#2206
#2210
#2212
#2214
#2215
#2217
#2219
#2219
#222
#2220
#2220
#2224
#2226
#2227
#2229
#223
#2230
#2231
#2232
#2232
#2233
#2239
#2240
#2241
#2244
#2246
#2247
#2248
#2249
#225
#2251
#2253
#2255
#2256
#2257
#2258
#2259
#226
#2261
#2267
#2268
#2269
#2269
#2272
#2275
#228
#2281
#2284
#2287
#2288
#2289
#2290
#2291
#2292
#2293
#2295
#2297
#2297
#2298
#23
#230
#2303
#2307
#2308
#2308
#231
#2312
#2314
#2315
#2321
#2322
#2323
#2323
#2324
#2326
#2327
#2328
#2328
#233
#2330
#2331
#2332
#2334
#2334
#2335
#2336
#2337
#2338
#2338
#234
#2341
#2342
#2343
#2345
#2346
#2347
#2347
#2349
#235
#2350
#2352
#2353
#2354
#2358
#236
#2362
#2365
#2367
#2369
#237
#2370
#2371
#2372
#2374
#2375
#2376
#2377
#2378
#2379
#2381
#2381
#2382
#2383
#2385
#239
#2390
#2392
#2393
#2398
#240
#2400
#2403
#2404
#2407
#2409
#2410
#2412
#2418
#2421
#2428
#243
#2430
#2431
#2432
#2433
#2434
#2435
#2435
#2436
#2436
#2439
#244
#2440
#2442
#2444
#2444
#2446
#2446
#2451
#2452
#2454
#2454
#2455
#2456
#2459
#2460
#2461
#2462
#2463
#2465
#2466
#2466
#2467
#2468
#2469
#247
#247
#2470
#2472
#2472
#2473
#2474
#2475
#2475
#2476
#2477
#248
#2480
#2481
#2484
#2485
#2487
#2487
#2488
#2489
#2491
#2494
#2495
#2495
#2496
#2497
#2498
#2499
#2500
#2500
#2502
#2503
#2508
#2509
#2510
#2510
#2511
#2513
#2514
#2516
#2519
#2521
#2523
#2524
#2525
#2529
#2530
#2530
#2531
#2532
#2533
#2534
#2537
#254
#2541
#2542
#2543
#2545
#2548
#255
#2553
#2554
#2555
#2557
#2559
#256
#2560
#2561
#2563
#2567
#2568
#2569
#257
#2574
#2576
#2577
#258
#2580
#2582
#2583
#2585
#2587
#259
#2590
#2591
#2595
#2598
#260
#2602
#2604
#2605
#2605
#2606
#2607
#261
#2610
#2611
#2614
#2615
#2615
#2617
#2619
#262
#2620
#2621
#2622
#2623
#2623
#2624
#2629
#2629
#2630
#2632
#2634
#2635
#2636
#2637
#264
#2641
#2641
#2645
#2646
#2647
#2649
#2651
#2659
#266
#2664
#2665
#2666
#2667
#2668
#2669
#2670
#2671
#2672
#2675
#2676
#2678
#268
#2685
#2687
#2689
#2690
#2690
#2691
#2692
#2693
#2695
#2696
#2698
#2699
#27
#2700
#2701
#2707
#2709
#2711
#2714
#2715
#2716
#2717
#2718
#2719
#272
#2720
#2725
#2726
#2729
#2730
#2731
#2732
#2733
#2739
#274
#2740
#2741
#2745
#2746
#2747
#2748
#2748
#2749
#2750
#2754
#2757
#2759
#2761
#2762
#2763
#2764
#2765
#2768
#2771
#2772
#2773
#2774
#2774
#2775
#2777
#2782
#2784
#2786
#2787
#2788
#279
#2792
#2792
#2794
#2795
#2799
#2799
#28
#2800
#2805
#2806
#2808
#281
#2810
#2813
#2815
#2815
#2816
#2817
#2818
#282
#2821
#2823
#2824
#2827
#2831
#2835
#2835
#2836
#2838
#2839
#2839
#284
#2843
#2845
#2845
#2849
#2851
#2851
#2854
#2854
#2859
#286
#2861
#2861
#2864
#2866
#2868
#2869
#2870
#2871
#2874
#2875
#2875
#2878
#2878
#2880
#2881
#2882
#2883
#2884
#2885
#2887
#2888
#2888
#2893
#2894
#2895
#2896
#290
#2900
#2901
#2902
#2903
#2904
#2905
#2907
#2908
#291
#2912
#2915
#2915
#2924
#2925
#2926
#2927
#2929
#2931
#2933
#2936
#294
#2941
#2945
#2946
#2947
#2948
#2952
#2953
#2954
#2956
#2957
#2959
#2960
#2962
#2963
#2963
#2964
#2967
#2970
#2973
#2974
#2977
#2978
#2980
#2981
#2982
#2983
#2983
#2985
#2988
#2988
#2989
#2989
#299
#2990
#2990
#2993
#2998
#2999
#3
#30
#3000
#3001
#3004
#3006
#3007
#3009
#301
#3010
#3011
#3012
#3013
#3014
#3014
#3016
#3017
#3019
#3020
#3021
#3022
#3023
#3029
#303
#3031
#3034
#3036
#3037
#304
#3041
#3044
#3046
#3047
#3049
#305
#3051
#3052
#3053
#3054
#3055
#3059
#3060
#3063
#3066
#3068
#307
#3071
#3072
#3077
#3077
#3078
#308
#3082
#3083
#3084
#3084
#309
#3090
#3091
#3092
#3094
#3099
#31
#310
#3100
#3100
#3101
#3102
#3103
#3105
#3106
#3108
#3109
#3111
#3112
#3113
#3117
#3119
#3120
#3127
#3128
#313
#3131
#3132
#3133
#3134
#3135
#3136
#3138
#3139
#314
#3141
#3142
#3144
#3145
#3146
#3151
#3152
#3154
#3155
#3155
#3156
#3161
#3162
#3167
#3167
#3168
#3168
#317
#3171
#3174
#3175
#3177
#3178
#3179
#318
#3180
#3180
#3181
#3183
#3184
#3186
#3187
#3188
#3189
#3191
#3191
#3192
#3194
#3196
#3197
#3198
#32
#320
#3202
#3203
#3204
#3206
#3207
#3208
#3209
#321
#321
#3211
#3212
#3214
#3215
#3216
#3217
#3219
#322
#3221
#3222
#3224
#3225
#3227
#3228
#3229
#3229
#323
#3230
#3231
#3235
#3239
#3241
#3242
#3245
#3247
#3247
#325
#3251
#3252
#3259
#3259
#3260
#3261
#3268
#327
#3270
#3272
#3274
#3280
#3281
#3282
#3283
#3283
#3284
#3285
#3287
#3289
#329
#3291
#3294
#3294
#3295
#3297
#3297
#3298
#33
#330
#3300
#3301
#3303
#3304
#3306
#3307
#3309
#3310
#3312
#3313
#3314
#3315
#3317
#332
#3320
#3321
#3326
#3326
#3327
#3328
#333
#3330
#3331
#3332
#3333
#3336
#3341
#3343
#3344
#3345
#3347
#3348
#335
#3352
#3353
#3355
#3356
#3357
#3357
#3359
#3362
#3363
#3367
#3368
#3369
#3370
#3371
#3378
#3383
#3384
#3385
#3388
#3388
#3389
#3389
#339
#3390
#3394
#3395
#3397
#3397
#34
#3401
#3404
#3405
#3405
#3409
#341
#3410
#3411
#3414
#3417
#3422
#3423
#3425
#3427
#3427
#3429
#3429
#343
#3430
#3433
#3438
#3438
#3439
#3441
#3442
#3448
#3454
#3455
#3456
#3458
#346
#3460
#3460
#3461
#3465
#3465
#3467
#3467
#3471
#3472
#3473
#3475
#3475
#3479
#3479
#348
#3482
#3483
#3484
#3485
#3485
#3489
#3490
#3492
#3493
#3493
#3494
#3495
#3496
#3497
#3499
#35
#350
#3500
#3501
#3502
#3503
#3505
#3506
#3507
#3509
#351
#3511
#3513
#3514
#3519
#3519
#3520
#3522
#3522
#3523
#3523
#3524
#3526
#3527
#3528
#3529
#353
#3530
#3531
#3532
#3533
#3534
#3535
#3537
#3540
#3541
#3543
#3544
#3547
#3548
#3548
#3552
#3553
#3555
#3556
#3563
#3565
#3567
#357
#3570
#3571
#3572
#3573
#3574
#3576
#3577
#3578
#358
#3580
#3582
#3586
#3587
#3588
#3589
#359
#359
#3590
#3590
#3594
#3595
#3596
#3598
#3599
#36
#360
#3600
#3601
#3604
#3605
#3605
#3608
#361
#3610
#3610
#3611
#3613
#3614
#3616
#3617
#362
#3621
#3623
#3625
#3626
#3627
#3628
#3628
#363
#3630
#3631
#3635
#3637
#3637
#3639
#364
#364
#3640
#3641
#3644
#3648
#3649
#3649
#3651
#3651
#3653
#3655
#3656
#3656
#3657
#366
#3661
#3662
#3663
#3667
#3668
#3670
#3673
#3673
#3675
#3677
#3678
#3679
#3679
#368
#3681
#3682
#3682
#3684
#3685
#3686
#3687
#3688
#3689
#3690
#3690
#3691
#3691
#3692
#3694
#3698
#3699
#37
#370
#3700
#3701
#3702
#3703
#3705
#3706
#3710
#3710
#3712
#3713
#3713
#3716
#3718
#3722
#3724
#3724
#3725
#3726
#3728
#3728
#3729
#3729
#3732
#3734
#3735
#3736
#3738
#3739
#374
#3746
#3747
#3747
#3748
#3749
#3749
#3750
#3751
#3755
#3756
#3760
#3763
#3764
#3765
#3765
#3767
#3768
#3769
#377
#3770
#3771
#3772
#3773
#3774
#3777
#3778
#3779
#3780
#3781
#3782
#3786
#3789
#379
#3790
#3793
#3797
#3799
#38
#3803
#3804
#381
#3810
#3812
#3812
#3814
#3814
#3815
#3817
#3819
#382
#3820
#3821
#3824
#386
#389
#39
#391
#392
#396
#4
#402
#403
#404
#408
#409
#41
#416
#417
#419
#419
#423
#424
#425
#426
#427
#43
#432
#435
#436
#436
#437
#44
#440
#442
#443
#445
#448
#449
#45
#450
#451
#452
#454
#459
#461
#462
#463
#464
#465
#469
#47
#470
#474
#475
#476
#478
#480
#482
#483
#487
#489
#49
#490
#495
#497
#499
#50
#500
#504
#505
#506
#507
#508
#510
#511
#515
#515
#52
#520
#524
#527
#532
#534
#54
#541
#542
#543
#545
#547
#547
#549
#55
#551
#552
#553
#554
#556
#557
#558
#559
#56
#560
#561
#562
#563
#564
#565
#569
#57
#570
#575
#577
#58
#581
#583
#585
#586
#587
#588
#59
#590
#591
#592
#599
#60
#601
#601
#602
#603
#61
#610
#611
#612
#614
#615
#617
#618
#619
#620
#621
#622
#623
#624
#629
#63
#631
#634
#635
#639
#640
#641
#642
#644
#645
#646
#648
#65
#650
#652
#657
#662
#663
#664
#669
#67
#674
#675
#676
#677
#681
#683
#684
#686
#687
#688
#691
#694
#695
#7
#70
#704
#706
#71
#711
#712
#714
#715
#717
#718
#72
#722
#723
#724
#729
#732
#735
#736
#737
#738
#738
#74
#741
#743
#743
#745
#749
#75
#753
#754
#755
#756
#757
#757
#759
#759
#760
#761
#762
#763
#764
#765
#769
#772
#773
#776
#777
#780
#781
#782
#784
#786
#787
#788
#789
#79
#790
#792
#793
#794
#794
#797
#80
#800
#802
#808
#808
#809
#81
#810
#810
#811
#812
#812
#813
#814
#818
#819
#820
#822
#824
#826
#828
#829
#83
#832
#833
#838
#84
#840
#844
#845
#846
#85
#850
#851
#852
#853
#854
#857
#858
#86
#861
#865
#866
#867
#868
#869
#871
#872
#875
#878
#879
#88
#881
#882
#883
#884
#885
#886
#887
#889
#89
#890
#893
#894
#9
#90
#902
#906
#908
#909
#91
#910
#912
#915
#916
#917
#918
#92
#921
#922
#923
#924
#925
#927
#929
#930
#931
#934
#938
#94
#941
#942
#944
#945
#947
#948
#948
#951
#954
#955
#955
#956
#956
#958
#959
#960
#962
#963
#969
#970
#971
#972
#973
#973
#975
#976
#978
#979
#98
#982
#983
#984
#986
#987
#989
#99
#990
#996
#998
v0.1
v0.1rc
v0.2
v0.2.0.post1
v0.2.0.post2
v0.3.0.post0
v0.3.0.post1
v0.3.0.rc0
v0.4.0
v0.4.1
v0.5.0
v0.6.0
-
2e1a1a6603
[BREAKING] [rollout] chore: remove default rollout selection (#2757)
Chi Zhang
2025-07-27 01:11:24 +08:00 -
ea4442470e
[algo] refactor: don't special-case `compute_policy_loss` (#2701)
Frederick Robinson
2025-07-26 10:09:42 -07:00 -
0f5ab5c854
[doc] feat: add retool blog (#2761)
H
2025-07-25 22:13:55 -07:00 -
92e81cfcfd
[perf] feat: add optional role selection in discrete mode for NPU Profiler (#2750)
YumiMom
2025-07-25 21:53:09 +08:00 -
f107800837
[rollout] feat: remove chat scheduler (#2725)
Joel
2025-07-25 21:46:35 +08:00 -
58d698e04b
[trainer] refactor: Make sure to keep the type checking (#2634)
Yeonwoo Sung
2025-07-25 14:32:07 +09:00 -
caec858ebb
[doc] style: change resize handle from gradient to plain color (#2746)
Tingberer
2025-07-25 12:20:07 +08:00 -
f407887414
[CI] feat: add `mypy` to pre-commit (#2614)
Frederick Robinson
2025-07-24 20:36:34 -07:00 -
dc8b5076c3
[megatron] feat: a bunch of optimzation on vram, sequence packing (#2678)
Yan Bai
2025-07-25 10:34:33 +08:00 -
4879d619fc
[docker] feat: upgrade to torch 2.7, sglang 0.4.8 (#2617)
Blue Space
2025-07-25 05:53:24 +08:00 -
bcd336fd46
[doc] feat: add resizable sidebar and improve layout (#2577)
Tingberer
2025-07-25 05:46:38 +08:00 -
1df03f3abf
[ci] fix: release ascend test time, fix one step off-policy CI (#2731)
Blue Space
2025-07-24 16:58:16 +08:00 -
a0248a8f17
[recipe] chore: add retool training script (#2732)
Joel
2025-07-24 16:34:10 +08:00 -
8adcffa25a
[ci] fix: checkpoint_convertor ci miss a hf model download (#2730)
Blue Space
2025-07-24 15:56:08 +08:00 -
88c084c4f3
[doc] feat: Add agent-lightning in the list of "awesome works using verl (#2726)
Wang Zilong
2025-07-24 14:49:27 +08:00 -
dc3015e9af
[tool] fix: geo3k create return str instead of tuple (#2714)
Nan Jiang
2025-07-23 22:56:13 -07:00 -
73fc53f600
[megatron] fix: resolve backward propagation error in megatron_actor due to shared logits tensor in-place modification (#2484)
Bowei Song
2025-07-24 13:37:18 +08:00 -
d57bfb02b3
[misc] chore: bump main branch version to v0.5.0.dev (#2718)
H
2025-07-23 19:46:16 -07:00 -
0eed7124fc
[sglang] fix: Adding strict naming sanity for sglang (#2719)
Chayenne
2025-07-24 10:45:57 +08:00 -
1862f748e5
[ray] feat: RayWorkerGroup support set worker env (#2685)
Jason Chen
2025-07-24 10:07:35 +08:00 -
6a9a1b872d
[ci] test: add CriticWorker unit test, make some util CPU friendly (#2717)
H
2025-07-23 15:36:10 -07:00 -
4de3ecf0f0
[cfg] refactor: add ActorConfig, EngineConfig, and ActorWorker unit test, refactor validation code (#2621)
H
2025-07-23 11:45:14 -07:00 -
8fdc4d3f20
[misc] chore: bump version to v0.5.0 (#2716)
v0.5.0
H
2025-07-23 10:57:10 -07:00 -
e13863e463
[ci] fix: auto-download model in Megatron-related CI tests (#2698)
Shawn/Yuxuan Tong
2025-07-24 01:49:09 +08:00 -
f926dc90b0
[sglang] fix: fix is_vlm issue (issue #2639) (#2667)
Nan Jiang
2025-07-23 10:45:57 -07:00 -
4ed106698b
[megatron] fix: CUDA_DEVICE_MAX_CONNECTIONS in ray error (#2709)
Blue Space
2025-07-23 18:57:57 +08:00 -
5bfb58e35d
[recipe] fix: fix dapo cannot save the checkpoint of last step (#2619)
Zhirong Chen
2025-07-23 17:26:35 +08:00 -
e9072c58fa
[ci] feat: CI request via Feishu (#2699)
Shawn/Yuxuan Tong
2025-07-23 14:54:15 +08:00 -
0404956290
[training_utils] fix: align tensorboard default dir for val_log_generation (#2696)
Xihuai Wang
2025-07-23 14:09:58 +08:00 -
c95c9ef701
[fsdp,megatron,sglang] fix: Fix torch reduce to speed up update weights (#2692)
Stefan He
2025-07-22 22:40:41 -07:00 -
dc1599b7e4
[rollout] fix: bug in init_engine Method of AsyncSglangServer (#2664)
OC
2025-07-23 13:09:37 +08:00 -
4792b70dd4
[megatron] fix: reset recompute_granularity and add backward compatibility fix (#2693)
Blue Space
2025-07-23 11:16:23 +08:00 -
4c10dddf74
[fsdp] fix: use torch 2.7 state dict api for torch 2.6 to resolve OOM (#2606)
Wei (Will) Feng
2025-07-22 19:54:33 -07:00 -
d20e5e07e1
[fsdp, ckpt] fix: Wrap `GenerationConfig.from_pretrained` with try-except to avoid crashes. (#2659)
rj42
2025-07-23 05:18:35 +03:00 -
8888122a89
[megatron] fix: remove the demising model.enable_gradient_checkpointing flags in the script (#2691)
H
2025-07-22 18:25:30 -07:00 -
f252da34cf
[megatron] fix: CUDA_DEVICE_MAX_CONNECTIONS not taking effect (#2687)
Blue Space
2025-07-22 20:51:12 +08:00 -
244481ac8f
[misc] fix: main pre-commit and API change (#2675)
Blue Space
2025-07-22 15:01:20 +08:00 -
c5b189a1af
[BREAKING][megatron] refactor: activation checkpointing APIs (#2651)
Blue Space
2025-07-22 10:24:28 +08:00 -
72cae971d0
[sglang] fix: rename Sglang to SGLang following SGLang's fashion (#2672)
Chayenne
2025-07-22 09:11:20 +08:00 -
d062314a18
[data, recipe] fix: remove redundant json parsing (#2671)
Zhihui Xie
2025-07-21 18:09:10 -07:00 -
2bcc5d1212
[misc] fix: fix prompt and response key in gemma7b example (#2610)
Lin Yuan
2025-07-21 16:06:52 -07:00 -
e5f0b2aa80
[perf] feat: mistral and gemma3_text mfu compute support (#2622)
Xihuai Wang
2025-07-21 16:54:11 +08:00 -
ac826e0558
[tool] chore: Add log for AsyncRolloutRequest ID, and rollout viewr to support request id display and search (#2636)
Hecate
2025-07-20 21:01:37 -07:00 -
3f6cd47926
[rollout,vllm] fix: A major issue in random sampling of vllm engine (#2646)
Guanning Zeng
2025-07-21 00:00:28 -04:00 -
ac414d95c4
[recipe] feat: add QWen 30b moe dapo script that can run on a single 80GB node (#2645)
Chi Zhang
2025-07-21 09:49:21 +08:00 -
5d5ae81cdb
[sglang] fix: update response handling and scoring method in GSM8K interaction (#2428)
Aaron Yee
2025-07-21 08:06:46 +08:00 -
fcb1e191b7
[doc] fix: non-standardized path references (#2637)
beep-bebop
2025-07-20 18:49:16 +08:00 -
7fc3029a1e
[doc] fix: add options to enable agent loop (#2624)
OC
2025-07-20 06:03:06 +08:00 -
5d52d15fd3
[trainer] feat: Add FSDPCheckpointManager for SFTtrainer, support resume training, manage the number of CKPTS in keep (#2292)
shaofei hu
2025-07-19 12:15:23 +08:00 -
69a467f934
[docker] fix: downgrade TransformerEngine version 2.2.1 to allow mcore image using rope fusion and provide another set of v0.5 image (#2611)
Blue Space
2025-07-18 17:23:19 +08:00 -
9d7cba4e12
[trainer] refactor: Training Engine Interface and Development Plan (#1977)
Ziheng Jiang
2025-07-17 22:05:21 -07:00 -
223caf7022
[single_controller] fix: padding for kwargs (#2585)
Le Xue
2025-07-18 10:10:49 +08:00 -
fb810355f3
[tool] fix: supports variable arguments for marked_timer (#2576)
X. HU
2025-07-18 04:35:36 +08:00 -
2b2aa9d3fd
[tool] chore: introduce RolloutViewer TUI tools (#2469)
杨睿
2025-07-18 04:30:41 +08:00 -
7459131411
[hardware] refactor: replace device_name with config.trainer.device (#2542)
Cheetah
2025-07-18 04:29:01 +08:00 -
2adedb77b4
[doc] chore: add agent loop design doc (#2598)
Joel
2025-07-18 04:27:27 +08:00 -
332c7d53c1
[cfg] refactor: add flatten megatron trainer config generation and verification script (#2582)
H
2025-07-17 08:08:45 -07:00 -
0b62a6ece1
[cfg] feat: add critic config class (#2583)
H
2025-07-17 00:59:47 -07:00 -
40d638c63b
[doc] fix: typo in perf_tuning.rst (#2590)
Xihuai Wang
2025-07-17 15:58:34 +08:00 -
648e3c95cc
[doc] fix: fix some contents for one step off policy (#2591)
meituan-search
2025-07-17 15:54:06 +08:00 -
1775bd638f
[trainer] fix: maybe_filter_out_long_prompts on image and video (#2553)
Qifan Zhang
2025-07-17 14:17:20 +08:00 -
d51c52f754
[ci] chore: add codeowner for role/engine (#2587)
H
2025-07-16 22:05:04 -07:00 -
64601e418c
set use_kl_in_reward=True in reinforce_plus_plus (#2580)
Titanpku
2025-07-17 12:10:54 +08:00 -
503ea75f53
[trainer, fsdp, vllm, recipe] feat: one step off async training recipe (#2231)
imh966
2025-07-17 10:45:53 +08:00 -
ef3fffc3a2
[trainer] refactor: no need to call load_reward_manager in compute_reward_async (#2557)
H
2025-07-16 18:52:36 -07:00 -
f0964b6650
[rollout] fix: fix bug for remax when the rollout mode is async (#2574)
none0663
2025-07-16 22:45:09 +08:00 -
40b2ebe9fd
Merge branch 'volcengine:main' into recipe/async_training
recipe/one_step_off_async
arron
2025-07-16 19:24:55 +08:00 -
8e5b714f0c
Merge pull request #3 from imh966/recipe/async_training_rollout_nodes
arron
2025-07-16 16:58:16 +08:00 -
e3db358fee
Merge branch 'recipe/async_training' into recipe/async_training_rollout_nodes
ArronHZG
2025-07-16 16:50:38 +08:00 -
174d94af20
Merge branch 'recipe/async_training' of https://github.com/imh966/verl into recipe/async_training
ArronHZG
2025-07-16 16:50:15 +08:00 -
c56467fa80
update docs
ArronHZG
2025-07-16 16:49:06 +08:00 -
3f63715a96
[doc] fix: fix non-existing tag of base image in docs (#2569)
Yuchen Cheng
2025-07-16 15:59:40 +08:00 -
1837fc7389
update code and doc by comments
ArronHZG
2025-07-16 15:57:04 +08:00 -
8df1c1bef1
ruff
ArronHZG
2025-07-16 15:49:48 +08:00 -
754cfaead1
update code and doc by comments
ArronHZG
2025-07-16 15:45:39 +08:00 -
1ed49c71e4
rollout.nnodes
ArronHZG
2025-07-16 15:16:13 +08:00 -
96b730bbed
[megatron] fix: wrong response_mask for megatron + sglang mutli-turn (#2543)
杨睿
2025-07-16 14:27:07 +08:00 -
da2ab088d9
[doc] fix: correct link in agentic RL doc (#2567)
OC
2025-07-16 14:26:02 +08:00 -
152c599303
[perf] feat: Clip gsm8k solution string to optimize reward calculation (#2568)
Huapeng Zhou
2025-07-16 01:51:44 -04:00 -
7aabfc437b
[rollout] feat: add ReactAgentLoop based on LangGraph (#2463)
Joel
2025-07-16 13:41:04 +08:00 -
6e21c0a625
[megatron] feat: support distributed megatron model converter and merger (#2281)
杨睿
2025-07-16 13:36:33 +08:00 -
1a89141222
[training_utils] fix: uneven support in split (#2560)
Yuge Zhang
2025-07-16 13:29:27 +08:00 -
e300d0f099
[doc] feat: add document for agentic RL related features (#2563)
OC
2025-07-16 12:51:16 +08:00 -
3f0773259c
[tool] fix: correctly convert 'None' to null in sandbox fusion _process_single_case (#2409)
Mathew Han
2025-07-15 20:53:39 -07:00 -
5f687b211d
[sglang] fix: adding missing param for sgl async unit test (#2561)
Chayenne
2025-07-15 20:22:43 -07:00 -
218298720f
[ci] chore: add single-controller reviewer (#2554)
H
2025-07-15 17:59:45 -07:00 -
f0d4c76ed6
[sglang] feat: update weights in batch with FSDP (#2559)
Chayenne
2025-07-15 16:57:20 -07:00 -
1fe5daf7f1
[sglang, megatron, perf] feat: speed up megatron sglang weight update by 10x (#2418)
杨睿
2025-07-16 05:46:45 +08:00 -
9b5646abcc
Fix pre-commit error: sort imports in async_main_ppo.py
openhands
2025-07-15 20:43:50 +00:00 -
a63243b0dd
[fsdp] fix: change geo3k model name from non-vl to vl (#2555)
Nan Jiang
2025-07-15 12:07:42 -07:00 -
166d91a62e
[trainer] refactor: minor code cleanup (#2537)
H
2025-07-15 09:24:49 -07:00 -
2c0ae781d9
[ray] fix: strip [] for ipv6 address (#2545)
Joel
2025-07-15 20:29:45 +08:00 -
2dea2598a1
[data] fix: Add missing init files in verl experimental data folders (#2548)
Joost van Doorn
2025-07-15 14:29:29 +02:00 -
10f4eb8cfc
[misc] chore: fix typo in function name (#2525)
ShareLer
2025-07-15 19:06:20 +08:00 -
473d8ff0c1
[env] fix: bump tensordict to 0.9.1 (#2541)
Yuge Zhang
2025-07-15 19:04:07 +08:00 -
659b108007
update ruff
ArronHZG
2025-07-15 18:44:14 +08:00 -
d8dd8b020b
Merge branch 'volcengine:main' into recipe/async_training
arron
2025-07-15 14:37:25 +08:00 -
c8468e6d8c
update comments
ArronHZG
2025-07-15 14:21:22 +08:00 -
bbd1288353
[data, megatron] feat: add dynamic batching computational workload balance (#2452)
Simiao Zhang
2025-07-15 14:17:28 +08:00 -
83d6a80ac0
[fsdp] fix: vlm dynamic batch & unify dynamic batch api (#2524)
Yaowei Zheng
2025-07-15 14:07:41 +08:00