diff --git a/dev/bench/data.js b/dev/bench/data.js index 9931e143f..37f662e66 100644 --- a/dev/bench/data.js +++ b/dev/bench/data.js @@ -1,5 +1,5 @@ window.BENCHMARK_DATA = { - "lastUpdate": 1732094857747, + "lastUpdate": 1732095662102, "repoUrl": "https://github.com/pytorch/tensordict", "entries": { "CPU Benchmark Results": [ @@ -334543,6 +334543,1549 @@ window.BENCHMARK_DATA = { "extra": "mean: 25.877353743584745 msec\nrounds: 39" } ] + }, + { + "commit": { + "author": { + "email": "vmoens@meta.com", + "name": "Vincent Moens", + "username": "vmoens" + }, + "committer": { + "email": "vmoens@meta.com", + "name": "Vincent Moens", + "username": "vmoens" + }, + "distinct": true, + "id": "a5656cb03f1dbdf26cb9524dfcdf1a3192b5c4b5", + "message": "[BugFix] fix inline TDParams kwargs for nontensordata\n\nghstack-source-id: afd50385b6b1e8bd8ccfaabfa387ca5611ca07e2\nPull Request resolved: https://github.com/pytorch/tensordict/pull/1094", + "timestamp": "2024-11-20T09:33:00Z", + "tree_id": "afd50385b6b1e8bd8ccfaabfa387ca5611ca07e2", + "url": "https://github.com/pytorch/tensordict/commit/a5656cb03f1dbdf26cb9524dfcdf1a3192b5c4b5" + }, + "date": 1732095637275, + "tool": "pytest", + "benches": [ + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_nested", + "value": 54070.454114226784, + "unit": "iter/sec", + "range": "stddev: 0.0000014118888696805399", + "extra": "mean: 18.494388781855715 usec\nrounds: 7328" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_stack_nested", + "value": 52920.69418651291, + "unit": "iter/sec", + "range": "stddev: 9.256250913518603e-7", + "extra": "mean: 18.896199593973854 usec\nrounds: 12315" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_nested_inplace", + "value": 49140.21467760463, + "unit": "iter/sec", + "range": "stddev: 0.0000014939963829387438", + "extra": "mean: 20.34993144740461 usec\nrounds: 30750" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_stack_nested_inplace", + "value": 48954.8225456976, + "unit": "iter/sec", + "range": "stddev: 0.0000011437915084545112", + "extra": "mean: 20.426996728801033 usec\nrounds: 32714" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items", + "value": 240465.07730321086, + "unit": "iter/sec", + "range": "stddev: 3.560360783606818e-7", + "extra": "mean: 4.158608024145913 usec\nrounds: 62736" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_nested", + "value": 2942.38060788207, + "unit": "iter/sec", + "range": "stddev: 0.000007239505987872256", + "extra": "mean: 339.86085869421277 usec\nrounds: 2668" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_nested_locked", + "value": 2970.37254000148, + "unit": "iter/sec", + "range": "stddev: 0.000007887515132996815", + "extra": "mean: 336.6581082114036 usec\nrounds: 2911" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_nested_leaf", + "value": 13945.79290897891, + "unit": "iter/sec", + "range": "stddev: 0.0000026403652709074253", + "extra": "mean: 71.70621323052606 usec\nrounds: 9811" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_stack_nested", + "value": 2846.877248678654, + "unit": "iter/sec", + "range": "stddev: 0.00006239376347783408", + "extra": "mean: 351.26207161342796 usec\nrounds: 2723" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_stack_nested_leaf", + "value": 13552.14290909017, + "unit": "iter/sec", + "range": "stddev: 0.00000414509587177949", + "extra": "mean: 73.78906839369623 usec\nrounds: 11843" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_stack_nested_locked", + "value": 2915.7150757685704, + "unit": "iter/sec", + "range": "stddev: 0.000006106054441136673", + "extra": "mean: 342.96903984570724 usec\nrounds: 2861" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys", + "value": 289106.59355911484, + "unit": "iter/sec", + "range": "stddev: 3.070423233046432e-7", + "extra": "mean: 3.458931834411884 usec\nrounds: 108838" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_nested", + "value": 7325.678526815051, + "unit": "iter/sec", + "range": "stddev: 0.000007045188411595878", + "extra": "mean: 136.50612654371622 usec\nrounds: 6156" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_nested_locked", + "value": 7067.017443671768, + "unit": "iter/sec", + "range": "stddev: 0.000022837004444108694", + "extra": "mean: 141.50241002948988 usec\nrounds: 6541" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_nested_leaf", + "value": 8553.887795845327, + "unit": "iter/sec", + "range": "stddev: 0.000011071362729655885", + "extra": "mean: 116.90590569655424 usec\nrounds: 7688" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_stack_nested", + "value": 7317.287898427484, + "unit": "iter/sec", + "range": "stddev: 0.000005306453178178542", + "extra": "mean: 136.6626561481754 usec\nrounds: 6465" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_stack_nested_leaf", + "value": 8524.001215041357, + "unit": "iter/sec", + "range": "stddev: 0.000006847707010147326", + "extra": "mean: 117.31579744913824 usec\nrounds: 7371" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_stack_nested_locked", + "value": 7115.41686394415, + "unit": "iter/sec", + "range": "stddev: 0.000005160711041380114", + "extra": "mean: 140.53990358137494 usec\nrounds: 6451" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values", + "value": 946039.6716350286, + "unit": "iter/sec", + "range": "stddev: 8.84678652679667e-8", + "extra": "mean: 1.0570381242804787 usec\nrounds: 179534" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_nested", + "value": 17922.018037968188, + "unit": "iter/sec", + "range": "stddev: 0.000004190143606558801", + "extra": "mean: 55.79728788808705 usec\nrounds: 12748" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_nested_locked", + "value": 18040.779246698083, + "unit": "iter/sec", + "range": "stddev: 0.0000034261683374094694", + "extra": "mean: 55.429978180295365 usec\nrounds: 16545" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_nested_leaf", + "value": 16658.51370274145, + "unit": "iter/sec", + "range": "stddev: 0.0000025174324345902337", + "extra": "mean: 60.02936503485497 usec\nrounds: 14037" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_stack_nested", + "value": 17397.221589179462, + "unit": "iter/sec", + "range": "stddev: 0.000008119882866830397", + "extra": "mean: 57.4804427749526 usec\nrounds: 14644" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_stack_nested_leaf", + "value": 16363.472343178584, + "unit": "iter/sec", + "range": "stddev: 0.000004063237860443151", + "extra": "mean: 61.11172366278777 usec\nrounds: 14001" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_stack_nested_locked", + "value": 17927.701897829513, + "unit": "iter/sec", + "range": "stddev: 0.000002142176363969026", + "extra": "mean: 55.77959772529846 usec\nrounds: 16270" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership", + "value": 1138030.902125495, + "unit": "iter/sec", + "range": "stddev: 1.4553080792207906e-7", + "extra": "mean: 878.7107609576371 nsec\nrounds: 176992" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested", + "value": 357396.6391856059, + "unit": "iter/sec", + "range": "stddev: 3.5846352177381453e-7", + "extra": "mean: 2.7980117616066122 usec\nrounds: 141985" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested_leaf", + "value": 363597.97188470926, + "unit": "iter/sec", + "range": "stddev: 2.930138549756766e-7", + "extra": "mean: 2.7502903682781903 usec\nrounds: 163613" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested", + "value": 367025.08150044293, + "unit": "iter/sec", + "range": "stddev: 3.204818003268277e-7", + "extra": "mean: 2.724609435169605 usec\nrounds: 92507" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested_leaf", + "value": 368484.84913398256, + "unit": "iter/sec", + "range": "stddev: 3.219229203936832e-7", + "extra": "mean: 2.713815784692944 usec\nrounds: 106191" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested_last", + "value": 247992.33896895437, + "unit": "iter/sec", + "range": "stddev: 4.3771022601353134e-7", + "extra": "mean: 4.032382629873045 usec\nrounds: 92251" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested_leaf_last", + "value": 244115.7986774241, + "unit": "iter/sec", + "range": "stddev: 6.117382893044608e-7", + "extra": "mean: 4.096416558935644 usec\nrounds: 110779" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested_last", + "value": 213071.00021820032, + "unit": "iter/sec", + "range": "stddev: 6.062599365222637e-7", + "extra": "mean: 4.693271252192587 usec\nrounds: 52313" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested_leaf_last", + "value": 214498.00399872765, + "unit": "iter/sec", + "range": "stddev: 4.3192994356688986e-7", + "extra": "mean: 4.6620480440737895 usec\nrounds: 64025" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_getleaf", + "value": 93260.92911212966, + "unit": "iter/sec", + "range": "stddev: 6.237552076693799e-7", + "extra": "mean: 10.722603876245733 usec\nrounds: 63980" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_get", + "value": 98833.04148623183, + "unit": "iter/sec", + "range": "stddev: 7.334940912229854e-7", + "extra": "mean: 10.118073722736819 usec\nrounds: 66099" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_getleaf", + "value": 94012.8846918902, + "unit": "iter/sec", + "range": "stddev: 0.0000010221058609195385", + "extra": "mean: 10.636839868038457 usec\nrounds: 40991" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_get", + "value": 98570.08631560058, + "unit": "iter/sec", + "range": "stddev: 9.437748996900453e-7", + "extra": "mean: 10.145065682485164 usec\nrounds: 56971" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_getitemleaf", + "value": 90402.99202998953, + "unit": "iter/sec", + "range": "stddev: 6.768460372944996e-7", + "extra": "mean: 11.061580790028149 usec\nrounds: 49412" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_getitem", + "value": 96852.51785464071, + "unit": "iter/sec", + "range": "stddev: 8.762513685810162e-7", + "extra": "mean: 10.324976801334493 usec\nrounds: 63452" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_getitemleaf", + "value": 90994.29634372881, + "unit": "iter/sec", + "range": "stddev: 8.564683354887144e-7", + "extra": "mean: 10.989699796375406 usec\nrounds: 48547" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_getitem", + "value": 95728.5246397221, + "unit": "iter/sec", + "range": "stddev: 6.806888863821701e-7", + "extra": "mean: 10.446207165142653 usec\nrounds: 53175" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_lock_nested", + "value": 1833.8512233110373, + "unit": "iter/sec", + "range": "stddev: 0.0033524800050902933", + "extra": "mean: 545.3005059998759 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_lock_stack_nested", + "value": 2439.4196000023367, + "unit": "iter/sec", + "range": "stddev: 0.00002068395890727959", + "extra": "mean: 409.9335760026861 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unlock_nested", + "value": 2759.1324725821974, + "unit": "iter/sec", + "range": "stddev: 0.00007475249380188844", + "extra": "mean: 362.4327609990132 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unlock_stack_nested", + "value": 2943.0499815774633, + "unit": "iter/sec", + "range": "stddev: 0.000022268389010556902", + "extra": "mean: 339.7835600005692 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_flatten_speed", + "value": 10740.784721379812, + "unit": "iter/sec", + "range": "stddev: 0.0000037285358444008676", + "extra": "mean: 93.103067042157 usec\nrounds: 7816" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unflatten_speed", + "value": 2124.02747031726, + "unit": "iter/sec", + "range": "stddev: 0.000012667890481812045", + "extra": "mean: 470.8037038007954 usec\nrounds: 1921" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_common_ops", + "value": 1186.9566939667393, + "unit": "iter/sec", + "range": "stddev: 0.0001536316979317013", + "extra": "mean: 842.4907202452846 usec\nrounds: 815" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation", + "value": 490372.9675119075, + "unit": "iter/sec", + "range": "stddev: 5.186536863797685e-7", + "extra": "mean: 2.0392641239460603 usec\nrounds: 89598" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation_empty", + "value": 79123.94515908413, + "unit": "iter/sec", + "range": "stddev: 0.0000010190784733015442", + "extra": "mean: 12.638399134287747 usec\nrounds: 17092" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation_nested_1", + "value": 64126.33569082688, + "unit": "iter/sec", + "range": "stddev: 0.0000012621895375448455", + "extra": "mean: 15.59421709079578 usec\nrounds: 19052" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation_nested_2", + "value": 51069.01118294034, + "unit": "iter/sec", + "range": "stddev: 0.0000014454989946748633", + "extra": "mean: 19.581346433706774 usec\nrounds: 17429" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_clone", + "value": 74846.82069644179, + "unit": "iter/sec", + "range": "stddev: 0.000003688670097621941", + "extra": "mean: 13.360620941478945 usec\nrounds: 13610" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[int]", + "value": 79683.76947943734, + "unit": "iter/sec", + "range": "stddev: 0.00001249228331095498", + "extra": "mean: 12.549607109865118 usec\nrounds: 10774" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[slice_int]", + "value": 41480.197677261036, + "unit": "iter/sec", + "range": "stddev: 0.000008175786273824666", + "extra": "mean: 24.107888968624383 usec\nrounds: 8376" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[range]", + "value": 19914.583308240253, + "unit": "iter/sec", + "range": "stddev: 0.000010075098685277646", + "extra": "mean: 50.21445764251668 usec\nrounds: 4521" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[tuple]", + "value": 49999.67410819609, + "unit": "iter/sec", + "range": "stddev: 0.000007701902711076513", + "extra": "mean: 20.000130357571212 usec\nrounds: 14138" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[list]", + "value": 21667.06409752263, + "unit": "iter/sec", + "range": "stddev: 0.000009589440814314864", + "extra": "mean: 46.15299957110193 usec\nrounds: 6993" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[int]", + "value": 36923.13736253571, + "unit": "iter/sec", + "range": "stddev: 0.000003843531245226354", + "extra": "mean: 27.083289000643163 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[slice_int]", + "value": 18771.046449951184, + "unit": "iter/sec", + "range": "stddev: 0.000004793114846709568", + "extra": "mean: 53.27353499797027 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[range]", + "value": 13376.260786085444, + "unit": "iter/sec", + "range": "stddev: 0.000005581618052225133", + "extra": "mean: 74.75930800035258 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[tuple]", + "value": 24230.469956718953, + "unit": "iter/sec", + "range": "stddev: 0.0000032680608264306354", + "extra": "mean: 41.27035099963905 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem", + "value": 45957.49319316475, + "unit": "iter/sec", + "range": "stddev: 0.000005749702743843777", + "extra": "mean: 21.7592372977543 usec\nrounds: 15272" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set", + "value": 47284.93083739411, + "unit": "iter/sec", + "range": "stddev: 0.000003975419269749503", + "extra": "mean: 21.148386648567858 usec\nrounds: 13167" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set_shared", + "value": 5651.144860582322, + "unit": "iter/sec", + "range": "stddev: 0.00013259593236670283", + "extra": "mean: 176.95529395736548 usec\nrounds: 3310" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_update", + "value": 40182.665366342546, + "unit": "iter/sec", + "range": "stddev: 0.000006032870004554629", + "extra": "mean: 24.886353129715765 usec\nrounds: 21165" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_update_nested", + "value": 28485.32846681369, + "unit": "iter/sec", + "range": "stddev: 0.000005858730437915923", + "extra": "mean: 35.105791431017956 usec\nrounds: 11459" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_update__nested", + "value": 30073.71991299626, + "unit": "iter/sec", + "range": "stddev: 0.000010648969976151674", + "extra": "mean: 33.251623107916664 usec\nrounds: 7729" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set_nested", + "value": 42740.417867448356, + "unit": "iter/sec", + "range": "stddev: 0.000006494102625892744", + "extra": "mean: 23.397057162644465 usec\nrounds: 13173" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set_nested_new", + "value": 35798.07149221241, + "unit": "iter/sec", + "range": "stddev: 0.000005390623530889732", + "extra": "mean: 27.934465693704816 usec\nrounds: 12753" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_select", + "value": 22425.52383203921, + "unit": "iter/sec", + "range": "stddev: 0.000004889012495757051", + "extra": "mean: 44.592046432882256 usec\nrounds: 9476" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_select_nested", + "value": 16971.30767519473, + "unit": "iter/sec", + "range": "stddev: 0.000004981172437592046", + "extra": "mean: 58.922978661308484 usec\nrounds: 11200" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_exclude_nested", + "value": 13253.593010985229, + "unit": "iter/sec", + "range": "stddev: 0.000010528888622412689", + "extra": "mean: 75.45123795269335 usec\nrounds: 9317" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_empty[True]", + "value": 2788.291287667574, + "unit": "iter/sec", + "range": "stddev: 0.000059927834945754724", + "extra": "mean: 358.64258674225795 usec\nrounds: 2519" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_empty[False]", + "value": 814879.0711570994, + "unit": "iter/sec", + "range": "stddev: 1.1009509875093787e-7", + "extra": "mean: 1.2271759521078818 usec\nrounds: 193088" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unbind_speed", + "value": 3865.4829712540127, + "unit": "iter/sec", + "range": "stddev: 0.000008636926809650952", + "extra": "mean: 258.6998849656262 usec\nrounds: 765" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unbind_speed_stack0", + "value": 3913.661685157648, + "unit": "iter/sec", + "range": "stddev: 0.000008711867289296948", + "extra": "mean: 255.51518768023467 usec\nrounds: 3474" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unbind_speed_stack1", + "value": 1405.0529110043956, + "unit": "iter/sec", + "range": "stddev: 0.002994220401172104", + "extra": "mean: 711.7169696372179 usec\nrounds: 1482" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_split", + "value": 571.2576104184063, + "unit": "iter/sec", + "range": "stddev: 0.004901015092549829", + "extra": "mean: 1.750523724782537 msec\nrounds: 585" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_chunk", + "value": 570.5848281280206, + "unit": "iter/sec", + "range": "stddev: 0.004774594667696988", + "extra": "mean: 1.7525877848536706 msec\nrounds: 581" + }, + { + "name": "benchmarks/common/h2d_test.py::TestConsolidate::test_consolidate_njt[False-None]", + "value": 116.56138674973883, + "unit": "iter/sec", + "range": "stddev: 0.00014334716113744946", + "extra": "mean: 8.579170408696605 msec\nrounds: 115" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_creation[device0]", + "value": 10581.553970009365, + "unit": "iter/sec", + "range": "stddev: 0.000014010116046277366", + "extra": "mean: 94.50407783528179 usec\nrounds: 2698" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_creation_from_tensor", + "value": 9569.550786674361, + "unit": "iter/sec", + "range": "stddev: 0.0000561079087499082", + "extra": "mean: 104.49811305589226 usec\nrounds: 5599" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_add_one[memmap_tensor0]", + "value": 202280.2638696418, + "unit": "iter/sec", + "range": "stddev: 0.0000073833996105509885", + "extra": "mean: 4.943636026915821 usec\nrounds: 21323" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_contiguous[memmap_tensor0]", + "value": 1931574.4742855981, + "unit": "iter/sec", + "range": "stddev: 1.1885851496381063e-7", + "extra": "mean: 517.7123705622869 nsec\nrounds: 68790" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_stack[memmap_tensor0]", + "value": 281813.25321473234, + "unit": "iter/sec", + "range": "stddev: 0.0000010726480538607733", + "extra": "mean: 3.548449154156825 usec\nrounds: 23099" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_memmaptd_index", + "value": 4124.430888940069, + "unit": "iter/sec", + "range": "stddev: 0.00005766565530181734", + "extra": "mean: 242.45769341936736 usec\nrounds: 1732" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_memmaptd_index_astensor", + "value": 3124.5133985184125, + "unit": "iter/sec", + "range": "stddev: 0.00005595112947468305", + "extra": "mean: 320.04983575176277 usec\nrounds: 2618" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_memmaptd_index_op", + "value": 1600.282243509325, + "unit": "iter/sec", + "range": "stddev: 0.00007348716528984957", + "extra": "mean: 624.8897680743233 usec\nrounds: 1397" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_serialize_model", + "value": 7.439291486469089, + "unit": "iter/sec", + "range": "stddev: 0.04574376405721572", + "extra": "mean: 134.4214031428724 msec\nrounds: 7" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_serialize_model_pickle", + "value": 2.5062435665039815, + "unit": "iter/sec", + "range": "stddev: 0.0685585434023953", + "extra": "mean: 399.0035180000177 msec\nrounds: 5" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_serialize_weights", + "value": 8.663730157903968, + "unit": "iter/sec", + "range": "stddev: 0.004611653626524735", + "extra": "mean: 115.42372416662754 msec\nrounds: 6" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_serialize_weights_returnearly", + "value": 6.265940890418302, + "unit": "iter/sec", + "range": "stddev: 0.00196529898694413", + "extra": "mean: 159.59295140003178 msec\nrounds: 5" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_serialize_weights_pickle", + "value": 2.2769262538587904, + "unit": "iter/sec", + "range": "stddev: 0.10738353163781476", + "extra": "mean: 439.18857639998805 msec\nrounds: 5" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_serialize_weights_filesystem", + "value": 6.224004373206632, + "unit": "iter/sec", + "range": "stddev: 0.041350162523725295", + "extra": "mean: 160.66826757141175 msec\nrounds: 7" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_serialize_model_filesystem", + "value": 6.315375697867116, + "unit": "iter/sec", + "range": "stddev: 0.00855122458309391", + "extra": "mean: 158.34370714282744 msec\nrounds: 7" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_reshape_pytree", + "value": 37695.783410229065, + "unit": "iter/sec", + "range": "stddev: 0.0000017433089373391122", + "extra": "mean: 26.528166005130473 usec\nrounds: 9819" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_reshape_td", + "value": 29996.772878213826, + "unit": "iter/sec", + "range": "stddev: 0.0000018310888949923794", + "extra": "mean: 33.33691940996373 usec\nrounds: 7656" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_view_pytree", + "value": 37599.8395769402, + "unit": "iter/sec", + "range": "stddev: 0.000001724151178574738", + "extra": "mean: 26.595858153961252 usec\nrounds: 13000" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_view_td", + "value": 26299.467136173385, + "unit": "iter/sec", + "range": "stddev: 0.000004400368579444876", + "extra": "mean: 38.023584083365634 usec\nrounds: 9009" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_unbind_pytree", + "value": 33813.422960574026, + "unit": "iter/sec", + "range": "stddev: 0.0000019220544557393224", + "extra": "mean: 29.57405410170943 usec\nrounds: 10277" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_unbind_td", + "value": 26006.967332754542, + "unit": "iter/sec", + "range": "stddev: 0.000003921450398016621", + "extra": "mean: 38.45123451747284 usec\nrounds: 10980" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_split_pytree", + "value": 33546.56790256644, + "unit": "iter/sec", + "range": "stddev: 0.000002023251137534769", + "extra": "mean: 29.80930874670777 usec\nrounds: 11239" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_split_td", + "value": 22730.795827656635, + "unit": "iter/sec", + "range": "stddev: 0.000014313054609583999", + "extra": "mean: 43.99318033481681 usec\nrounds: 9621" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_add_pytree", + "value": 26600.81763322725, + "unit": "iter/sec", + "range": "stddev: 0.0000050117418185382095", + "extra": "mean: 37.592829430584636 usec\nrounds: 7047" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_add_td", + "value": 17162.030647408417, + "unit": "iter/sec", + "range": "stddev: 0.000007082130967469218", + "extra": "mean: 58.268163048118474 usec\nrounds: 6587" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_nested[tensordict-compile]", + "value": 15723.565330447023, + "unit": "iter/sec", + "range": "stddev: 0.000004831843029091212", + "extra": "mean: 63.59880720332593 usec\nrounds: 11717" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_nested[tensordict-eager]", + "value": 6255.48901104438, + "unit": "iter/sec", + "range": "stddev: 0.000012521313793501533", + "extra": "mean: 159.85960461835194 usec\nrounds: 5501" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_nested[pytree-compile]", + "value": 21119.008623968573, + "unit": "iter/sec", + "range": "stddev: 0.000003777516500967989", + "extra": "mean: 47.35070749793961 usec\nrounds: 13764" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_nested[pytree-eager]", + "value": 8449.776067862225, + "unit": "iter/sec", + "range": "stddev: 0.0000069807211905499225", + "extra": "mean: 118.34633154402609 usec\nrounds: 7272" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_copy_nested[tensordict-compile]", + "value": 38429.71091784393, + "unit": "iter/sec", + "range": "stddev: 0.0000016542668901456788", + "extra": "mean: 26.02153323863994 usec\nrounds: 20383" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_copy_nested[tensordict-eager]", + "value": 18667.62388826333, + "unit": "iter/sec", + "range": "stddev: 0.0000029679827467155007", + "extra": "mean: 53.56868158398659 usec\nrounds: 16312" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_copy_nested[pytree-compile]", + "value": 12418.084094396718, + "unit": "iter/sec", + "range": "stddev: 0.000003948106417833679", + "extra": "mean: 80.52772008938315 usec\nrounds: 10314" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_copy_nested[pytree-eager]", + "value": 14718.841853896174, + "unit": "iter/sec", + "range": "stddev: 0.000003362012192916804", + "extra": "mean: 67.94012802952248 usec\nrounds: 12794" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_flat[tensordict-compile]", + "value": 9219.06792465769, + "unit": "iter/sec", + "range": "stddev: 0.000009675657900352799", + "extra": "mean: 108.47083546541184 usec\nrounds: 6953" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_flat[tensordict-eager]", + "value": 5094.064090928839, + "unit": "iter/sec", + "range": "stddev: 0.000007336037116309624", + "extra": "mean: 196.3069137235104 usec\nrounds: 4671" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_flat[tensorclass-compile]", + "value": 22375.34200003914, + "unit": "iter/sec", + "range": "stddev: 0.0000050574964732544534", + "extra": "mean: 44.69205431578435 usec\nrounds: 12004" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_flat[tensorclass-eager]", + "value": 16423.631892110858, + "unit": "iter/sec", + "range": "stddev: 0.0000059271760737881384", + "extra": "mean: 60.88787221785902 usec\nrounds: 12490" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_flat[pytree-compile]", + "value": 9649.668222464321, + "unit": "iter/sec", + "range": "stddev: 0.000009351072783316206", + "extra": "mean: 103.63050593511713 usec\nrounds: 6740" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_flat[pytree-eager]", + "value": 4972.860871901239, + "unit": "iter/sec", + "range": "stddev: 0.00001613905244887844", + "extra": "mean: 201.091489538833 usec\nrounds: 4684" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_self_flat[tensordict-eager]", + "value": 4779.791520430543, + "unit": "iter/sec", + "range": "stddev: 0.00000830522904790458", + "extra": "mean: 209.21414578975703 usec\nrounds: 4335" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_self_flat[tensordict-compile]", + "value": 9296.105809338005, + "unit": "iter/sec", + "range": "stddev: 0.000007477173124110195", + "extra": "mean: 107.57192533194845 usec\nrounds: 6549" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_self_flat[tensorclass-eager]", + "value": 17948.96107078432, + "unit": "iter/sec", + "range": "stddev: 0.000011998336020977977", + "extra": "mean: 55.713531053767156 usec\nrounds: 13219" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_self_flat[tensorclass-compile]", + "value": 20743.82021321147, + "unit": "iter/sec", + "range": "stddev: 0.000005338258160563395", + "extra": "mean: 48.20712818187235 usec\nrounds: 11866" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_self_flat[pytree-eager]", + "value": 6213.755985534642, + "unit": "iter/sec", + "range": "stddev: 0.000013236597551885136", + "extra": "mean: 160.93325877745397 usec\nrounds: 5839" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_self_flat[pytree-compile]", + "value": 9523.44092204183, + "unit": "iter/sec", + "range": "stddev: 0.000010271301310794241", + "extra": "mean: 105.00406399177827 usec\nrounds: 7626" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_copy_flat[tensordict-compile]", + "value": 47452.219159520566, + "unit": "iter/sec", + "range": "stddev: 0.0000019504209271618517", + "extra": "mean: 21.073830006522787 usec\nrounds: 14377" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_copy_flat[tensordict-eager]", + "value": 17234.417090764728, + "unit": "iter/sec", + "range": "stddev: 0.0000054895377059512786", + "extra": "mean: 58.02343036805476 usec\nrounds: 15352" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_copy_flat[pytree-compile]", + "value": 12430.68926882803, + "unit": "iter/sec", + "range": "stddev: 0.000004141230911248542", + "extra": "mean: 80.44606203033827 usec\nrounds: 10656" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_copy_flat[pytree-eager]", + "value": 14324.930272558922, + "unit": "iter/sec", + "range": "stddev: 0.000006183863623640547", + "extra": "mean: 69.80836771789507 usec\nrounds: 12855" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_assign_and_add[tensordict-compile]", + "value": 4765.832406280223, + "unit": "iter/sec", + "range": "stddev: 0.000009536115224971649", + "extra": "mean: 209.82693362910538 usec\nrounds: 3149" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_assign_and_add[tensordict-eager]", + "value": 780.2381294706282, + "unit": "iter/sec", + "range": "stddev: 0.000027932423261055073", + "extra": "mean: 1.2816599986961348 msec\nrounds: 767" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_assign_and_add[pytree-compile]", + "value": 4926.425651944925, + "unit": "iter/sec", + "range": "stddev: 0.000015097472689242502", + "extra": "mean: 202.98692615105347 usec\nrounds: 2803" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_assign_and_add[pytree-eager]", + "value": 1291.7319109373661, + "unit": "iter/sec", + "range": "stddev: 0.00001474748117459105", + "extra": "mean: 774.1544445351155 usec\nrounds: 1235" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_assign_and_add_stack[compile]", + "value": 2192.8784289449563, + "unit": "iter/sec", + "range": "stddev: 0.000013505970623844838", + "extra": "mean: 456.021632025047 usec\nrounds: 1655" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_assign_and_add_stack[eager]", + "value": 358.9546874278206, + "unit": "iter/sec", + "range": "stddev: 0.000054941780650206466", + "extra": "mean: 2.785866949295883 msec\nrounds: 355" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[tensor-tensordict-compile]", + "value": 27314.702731892732, + "unit": "iter/sec", + "range": "stddev: 0.000004660294711242929", + "extra": "mean: 36.61031971738784 usec\nrounds: 17112" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[tensor-tensordict-eager]", + "value": 28465.48333718255, + "unit": "iter/sec", + "range": "stddev: 0.00001199259326725608", + "extra": "mean: 35.13026594892794 usec\nrounds: 19876" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[tensor-tensorclass-compile]", + "value": 33289.69807132856, + "unit": "iter/sec", + "range": "stddev: 0.000002970161830502405", + "extra": "mean: 30.039323212164263 usec\nrounds: 15940" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[tensor-tensorclass-eager]", + "value": 41636.9503739873, + "unit": "iter/sec", + "range": "stddev: 0.0000026892566943227764", + "extra": "mean: 24.017128800690223 usec\nrounds: 24169" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[tensor-pytree-compile]", + "value": 32451.59843438193, + "unit": "iter/sec", + "range": "stddev: 0.0000028855895375486813", + "extra": "mean: 30.815123083136534 usec\nrounds: 19499" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[tensor-pytree-eager]", + "value": 41782.65141111005, + "unit": "iter/sec", + "range": "stddev: 0.000003030982595237167", + "extra": "mean: 23.933378237794145 usec\nrounds: 24749" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[slice-tensordict-compile]", + "value": 18930.128186169517, + "unit": "iter/sec", + "range": "stddev: 0.000004463901120356049", + "extra": "mean: 52.825844081214775 usec\nrounds: 10685" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[slice-tensordict-eager]", + "value": 49917.249024767174, + "unit": "iter/sec", + "range": "stddev: 0.000011075715489618732", + "extra": "mean: 20.03315526269958 usec\nrounds: 31437" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[slice-tensorclass-compile]", + "value": 22151.783177019606, + "unit": "iter/sec", + "range": "stddev: 0.000003997045278863659", + "extra": "mean: 45.14309263542297 usec\nrounds: 12533" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[slice-tensorclass-eager]", + "value": 53113.72158917476, + "unit": "iter/sec", + "range": "stddev: 0.000001585235370764182", + "extra": "mean: 18.827526486184176 usec\nrounds: 33338" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[slice-pytree-compile]", + "value": 21965.934335651924, + "unit": "iter/sec", + "range": "stddev: 0.0000037855504349277846", + "extra": "mean: 45.525038212326116 usec\nrounds: 15623" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[slice-pytree-eager]", + "value": 52437.53059413641, + "unit": "iter/sec", + "range": "stddev: 0.0000016880563593947012", + "extra": "mean: 19.07031068529799 usec\nrounds: 19943" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[int-tensordict-compile]", + "value": 18602.12094788515, + "unit": "iter/sec", + "range": "stddev: 0.0000044894552493874224", + "extra": "mean: 53.75731094328191 usec\nrounds: 11478" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[int-tensordict-eager]", + "value": 49766.240932245564, + "unit": "iter/sec", + "range": "stddev: 0.000011539868452745927", + "extra": "mean: 20.093942826854327 usec\nrounds: 33250" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[int-tensorclass-compile]", + "value": 21813.843743529615, + "unit": "iter/sec", + "range": "stddev: 0.0000037546498355401437", + "extra": "mean: 45.842448114932445 usec\nrounds: 14108" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[int-tensorclass-eager]", + "value": 53151.20288788852, + "unit": "iter/sec", + "range": "stddev: 0.0000016096328064822682", + "extra": "mean: 18.81424964378122 usec\nrounds: 33664" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[int-pytree-compile]", + "value": 21963.32198880705, + "unit": "iter/sec", + "range": "stddev: 0.0000035956479324875354", + "extra": "mean: 45.53045302116046 usec\nrounds: 15869" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[int-pytree-eager]", + "value": 52819.91162505896, + "unit": "iter/sec", + "range": "stddev: 0.000001669063479501457", + "extra": "mean: 18.93225431913781 usec\nrounds: 33973" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_mod_add[eager]", + "value": 36263.33983253143, + "unit": "iter/sec", + "range": "stddev: 0.0000028694060711675915", + "extra": "mean: 27.576059034223633 usec\nrounds: 21174" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_mod_add[compile]", + "value": 21950.739164961033, + "unit": "iter/sec", + "range": "stddev: 0.0000039099265250500605", + "extra": "mean: 45.55655244613605 usec\nrounds: 8361" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_mod_add[compile-overhead]", + "value": 21546.4747009932, + "unit": "iter/sec", + "range": "stddev: 0.000005048279034589639", + "extra": "mean: 46.41130458125033 usec\nrounds: 6678" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_mod_wrap[eager]", + "value": 4449.802148481416, + "unit": "iter/sec", + "range": "stddev: 0.000014684093423977847", + "extra": "mean: 224.72909280725435 usec\nrounds: 3976" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_mod_wrap[compile]", + "value": 4790.025670734134, + "unit": "iter/sec", + "range": "stddev: 0.000035403122064919024", + "extra": "mean: 208.7671483912396 usec\nrounds: 2608" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_mod_wrap[compile-overhead]", + "value": 4854.163738217384, + "unit": "iter/sec", + "range": "stddev: 0.00001789261669366504", + "extra": "mean: 206.0087079730925 usec\nrounds: 2308" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_mod_wrap_and_backward[eager]", + "value": 88.08010243271825, + "unit": "iter/sec", + "range": "stddev: 0.00033621833623786036", + "extra": "mean: 11.353301964695943 msec\nrounds: 85" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_mod_wrap_and_backward[compile]", + "value": 75.86170360856009, + "unit": "iter/sec", + "range": "stddev: 0.001047677779477295", + "extra": "mean: 13.181881666669584 msec\nrounds: 72" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_mod_wrap_and_backward[compile-overhead]", + "value": 74.33801407836818, + "unit": "iter/sec", + "range": "stddev: 0.0012585980110768201", + "extra": "mean: 13.452067726019504 msec\nrounds: 73" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_seq_add[eager]", + "value": 9977.50273532101, + "unit": "iter/sec", + "range": "stddev: 0.000012811786925784262", + "extra": "mean: 100.22547991492249 usec\nrounds: 8414" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_seq_add[compile]", + "value": 16039.761728804026, + "unit": "iter/sec", + "range": "stddev: 0.000006773990820970023", + "extra": "mean: 62.34506577514871 usec\nrounds: 8529" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_seq_add[compile-overhead]", + "value": 16282.436608309054, + "unit": "iter/sec", + "range": "stddev: 0.000005162117040294003", + "extra": "mean: 61.41586938466521 usec\nrounds: 8215" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_seq_wrap[eager]", + "value": 2426.657892109809, + "unit": "iter/sec", + "range": "stddev: 0.00002546972680316327", + "extra": "mean: 412.08940215737215 usec\nrounds: 2131" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_seq_wrap[compile]", + "value": 4205.868547779901, + "unit": "iter/sec", + "range": "stddev: 0.000022000408997498625", + "extra": "mean: 237.76301818273834 usec\nrounds: 3080" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_seq_wrap[compile-overhead]", + "value": 4277.490857000267, + "unit": "iter/sec", + "range": "stddev: 0.000014130676919252556", + "extra": "mean: 233.78191407784405 usec\nrounds: 3154" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_runtime[False-eager]", + "value": 1732.605301101573, + "unit": "iter/sec", + "range": "stddev: 0.000040798347520670584", + "extra": "mean: 577.1654971644206 usec\nrounds: 1587" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_runtime[False-compile]", + "value": 2324.1698124268, + "unit": "iter/sec", + "range": "stddev: 0.000017511419004898925", + "extra": "mean: 430.26116020147526 usec\nrounds: 1985" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_runtime[False-compile-overhead]", + "value": 2315.1683534431413, + "unit": "iter/sec", + "range": "stddev: 0.00003308012639745543", + "extra": "mean: 431.9340312823429 usec\nrounds: 1918" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_runtime[True-eager]", + "value": 1291.8206376093813, + "unit": "iter/sec", + "range": "stddev: 0.000027970793759836046", + "extra": "mean: 774.1012729527073 usec\nrounds: 1220" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_runtime[True-compile]", + "value": 2124.420081853823, + "unit": "iter/sec", + "range": "stddev: 0.00003451174390717953", + "extra": "mean: 470.7166951309246 usec\nrounds: 1745" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_runtime[True-compile-overhead]", + "value": 2098.19252975123, + "unit": "iter/sec", + "range": "stddev: 0.00002127942836638237", + "extra": "mean: 476.60068645776954 usec\nrounds: 1920" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_cm_runtime[False-eager]", + "value": 1736.8291173816722, + "unit": "iter/sec", + "range": "stddev: 0.00003910631301100213", + "extra": "mean: 575.7618812307416 usec\nrounds: 1625" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_cm_runtime[False-compile]", + "value": 2314.791657690736, + "unit": "iter/sec", + "range": "stddev: 0.000016564595761502468", + "extra": "mean: 432.004321718358 usec\nrounds: 2095" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_cm_runtime[False-compile-overhead]", + "value": 2322.8857501704188, + "unit": "iter/sec", + "range": "stddev: 0.000018801703324158", + "extra": "mean: 430.4990032017868 usec\nrounds: 1874" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_cm_runtime[True-eager]", + "value": 1096.7130171437982, + "unit": "iter/sec", + "range": "stddev: 0.000026020330430350946", + "extra": "mean: 911.8155655746016 usec\nrounds: 976" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_cm_runtime[True-compile]", + "value": 2012.8665939549996, + "unit": "iter/sec", + "range": "stddev: 0.00001644373518240948", + "extra": "mean: 496.8039128888024 usec\nrounds: 1676" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_cm_runtime[True-compile-overhead]", + "value": 1948.5222210456325, + "unit": "iter/sec", + "range": "stddev: 0.00009315100257867165", + "extra": "mean: 513.2094410826742 usec\nrounds: 1519" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_vmap_func_call_cm_runtime[eager]", + "value": 503.7795378638519, + "unit": "iter/sec", + "range": "stddev: 0.00014752034634264805", + "extra": "mean: 1.984995270431673 msec\nrounds: 514" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_vmap_func_call_cm_runtime[compile]", + "value": 1919.3393220662829, + "unit": "iter/sec", + "range": "stddev: 0.00001715429568435357", + "extra": "mean: 521.012615384465 usec\nrounds: 1612" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_vmap_func_call_cm_runtime[compile-overhead]", + "value": 1868.6795874511229, + "unit": "iter/sec", + "range": "stddev: 0.00004152676392041228", + "extra": "mean: 535.1372202679214 usec\nrounds: 1421" + }, + { + "name": "benchmarks/distributed/distributed_benchmark_test.py::test_distributed", + "value": 7666.5754037106335, + "unit": "iter/sec", + "range": "stddev: 0.000011018240051649391", + "extra": "mean: 130.43633530506966 usec\nrounds: 3719" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdmodule", + "value": 48923.475611997856, + "unit": "iter/sec", + "range": "stddev: 0.000003777777032399383", + "extra": "mean: 20.440084999904684 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdmodule_dispatch", + "value": 25094.290542588955, + "unit": "iter/sec", + "range": "stddev: 0.0000031763533159285636", + "extra": "mean: 39.84970199906002 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdseq", + "value": 43029.86165010693, + "unit": "iter/sec", + "range": "stddev: 0.0000022358220412421655", + "extra": "mean: 23.239674998990267 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdseq_dispatch", + "value": 22084.918808711867, + "unit": "iter/sec", + "range": "stddev: 0.000002725928857155866", + "extra": "mean: 45.27976800193301 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_instantiation_functorch", + "value": 655.6353549911597, + "unit": "iter/sec", + "range": "stddev: 0.000039498493874499416", + "extra": "mean: 1.5252380647066899 msec\nrounds: 510" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_functorch", + "value": 5540.229988110772, + "unit": "iter/sec", + "range": "stddev: 0.000008120998706276795", + "extra": "mean: 180.49792195377827 usec\nrounds: 3357" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_functional_call", + "value": 5725.721567474933, + "unit": "iter/sec", + "range": "stddev: 0.00000857991189851508", + "extra": "mean: 174.6504764885038 usec\nrounds: 3828" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_td_decorator", + "value": 4358.263621448938, + "unit": "iter/sec", + "range": "stddev: 0.000012311290491338979", + "extra": "mean: 229.44917674978606 usec\nrounds: 2942" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[True-True]", + "value": 1484.432702317553, + "unit": "iter/sec", + "range": "stddev: 0.00005325414269949955", + "extra": "mean: 673.6580233234971 usec\nrounds: 1415" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[True-False]", + "value": 1518.3445704126198, + "unit": "iter/sec", + "range": "stddev: 0.00003557194738097202", + "extra": "mean: 658.6120301587692 usec\nrounds: 1459" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[False-True]", + "value": 1870.2311853077063, + "unit": "iter/sec", + "range": "stddev: 0.00003081976256186187", + "extra": "mean: 534.6932549600662 usec\nrounds: 1412" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[False-False]", + "value": 1871.6193340403256, + "unit": "iter/sec", + "range": "stddev: 0.00002774078387871895", + "extra": "mean: 534.2966819226361 usec\nrounds: 1770" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_to_module_speed[True]", + "value": 780.6986138256177, + "unit": "iter/sec", + "range": "stddev: 0.000027949230882443192", + "extra": "mean: 1.2809040291486504 msec\nrounds: 446" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_to_module_speed[False]", + "value": 800.3476575753763, + "unit": "iter/sec", + "range": "stddev: 0.000020825345863101615", + "extra": "mean: 1.2494570210019271 msec\nrounds: 619" + }, + { + "name": "benchmarks/tensorclass/test_tensorclass_speed.py::test_tc_init", + "value": 21909.746917118555, + "unit": "iter/sec", + "range": "stddev: 0.000002404107669020803", + "extra": "mean: 45.641786908030355 usec\nrounds: 4247" + }, + { + "name": "benchmarks/tensorclass/test_tensorclass_speed.py::test_tc_init_nested", + "value": 10890.456966441561, + "unit": "iter/sec", + "range": "stddev: 0.000004988208488596765", + "extra": "mean: 91.82351145424417 usec\nrounds: 5457" + }, + { + "name": "benchmarks/tensorclass/test_tensorclass_speed.py::test_tc_first_layer_tensor", + "value": 656763.6990459543, + "unit": "iter/sec", + "range": "stddev: 1.8966625344819204e-7", + "extra": "mean: 1.5226176499289577 usec\nrounds: 131683" + }, + { + "name": "benchmarks/tensorclass/test_tensorclass_speed.py::test_tc_first_layer_nontensor", + "value": 212767.89596223427, + "unit": "iter/sec", + "range": "stddev: 4.5100273902658517e-7", + "extra": "mean: 4.699957178584392 usec\nrounds: 70993" + }, + { + "name": "benchmarks/tensorclass/test_tensorclass_speed.py::test_tc_second_layer_tensor", + "value": 355649.7258584886, + "unit": "iter/sec", + "range": "stddev: 3.129639653416616e-7", + "extra": "mean: 2.8117552954276577 usec\nrounds: 140786" + }, + { + "name": "benchmarks/tensorclass/test_tensorclass_speed.py::test_tc_second_layer_nontensor", + "value": 166323.91125553267, + "unit": "iter/sec", + "range": "stddev: 4.1332792126797024e-7", + "extra": "mean: 6.012364623049565 usec\nrounds: 76191" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_unbind", + "value": 76.70275581663044, + "unit": "iter/sec", + "range": "stddev: 0.04619354477160998", + "extra": "mean: 13.037341218751664 msec\nrounds: 64" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_full_like", + "value": 137.07803979714083, + "unit": "iter/sec", + "range": "stddev: 0.00027735223676556925", + "extra": "mean: 7.295114530962661 msec\nrounds: 113" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_zeros_like", + "value": 155.11934836915347, + "unit": "iter/sec", + "range": "stddev: 0.0004074149183438684", + "extra": "mean: 6.446649051285318 msec\nrounds: 156" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_ones_like", + "value": 127.89484235498482, + "unit": "iter/sec", + "range": "stddev: 0.0006299827020086482", + "extra": "mean: 7.818923590557317 msec\nrounds: 127" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_clone", + "value": 107.61539503779638, + "unit": "iter/sec", + "range": "stddev: 0.0004738948940913407", + "extra": "mean: 9.292350779819028 msec\nrounds: 109" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_squeeze", + "value": 84826.87363799204, + "unit": "iter/sec", + "range": "stddev: 0.0000011480947709714305", + "extra": "mean: 11.788716913788539 usec\nrounds: 15709" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_unsqueeze", + "value": 11108.669001833801, + "unit": "iter/sec", + "range": "stddev: 0.000006436709412325544", + "extra": "mean: 90.01978543378344 usec\nrounds: 4064" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_split", + "value": 5303.847755739249, + "unit": "iter/sec", + "range": "stddev: 0.00002086904707020904", + "extra": "mean: 188.54236510048926 usec\nrounds: 2980" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_permute", + "value": 4523.0806537909675, + "unit": "iter/sec", + "range": "stddev: 0.00002259809519483744", + "extra": "mean: 221.0882530166385 usec\nrounds: 2154" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_stack", + "value": 38.354242934680954, + "unit": "iter/sec", + "range": "stddev: 0.004914740881902125", + "extra": "mean: 26.072734682914902 msec\nrounds: 41" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_cat", + "value": 41.00894729776866, + "unit": "iter/sec", + "range": "stddev: 0.0008599506323875732", + "extra": "mean: 24.384922459455844 msec\nrounds: 37" + } + ] } ], "GPU Benchmark Results": [