diff --git a/dev/bench/data.js b/dev/bench/data.js index bb6b9d004..42144557d 100644 --- a/dev/bench/data.js +++ b/dev/bench/data.js @@ -1,5 +1,5 @@ window.BENCHMARK_DATA = { - "lastUpdate": 1701698328822, + "lastUpdate": 1701698460733, "repoUrl": "https://github.com/pytorch/tensordict", "entries": { "CPU Benchmark Results": [ @@ -227329,6 +227329,919 @@ window.BENCHMARK_DATA = { "extra": "mean: 20.293646140344208 msec\nrounds: 50" } ] + }, + { + "commit": { + "author": { + "email": "vmoens@meta.com", + "name": "Vincent Moens", + "username": "vmoens" + }, + "committer": { + "email": "noreply@github.com", + "name": "GitHub", + "username": "web-flow" + }, + "distinct": true, + "id": "a25b22b0e7856c6e277bd552b67b76e790a816d3", + "message": "[BugFix] Fix non-blocking arg in copy_ (#590)", + "timestamp": "2023-12-04T13:54:35Z", + "tree_id": "5c51e3d43c69c027c01f25fe13e0d577a4a40f0b", + "url": "https://github.com/pytorch/tensordict/commit/a25b22b0e7856c6e277bd552b67b76e790a816d3" + }, + "date": 1701698458312, + "tool": "pytest", + "benches": [ + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_nested", + "value": 78437.30748079442, + "unit": "iter/sec", + "range": "stddev: 7.994454177425739e-7", + "extra": "mean: 12.749035275654414 usec\nrounds: 19275" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_stack_nested", + "value": 8171.059242216651, + "unit": "iter/sec", + "range": "stddev: 0.00001516009925620079", + "extra": "mean: 122.38315380622784 usec\nrounds: 26" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_nested_inplace", + "value": 70777.21352167318, + "unit": "iter/sec", + "range": "stddev: 7.282118760239931e-7", + "extra": "mean: 14.128841052689692 usec\nrounds: 48217" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_stack_nested_inplace", + "value": 6768.082375290409, + "unit": "iter/sec", + "range": "stddev: 0.000003273479619072119", + "extra": "mean: 147.75233877928255 usec\nrounds: 5074" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items", + "value": 214458.7045960396, + "unit": "iter/sec", + "range": "stddev: 3.234078356712968e-7", + "extra": "mean: 4.662902361009911 usec\nrounds: 128535" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_nested", + "value": 2956.474568318275, + "unit": "iter/sec", + "range": "stddev: 0.000004157184028006808", + "extra": "mean: 338.2406906915583 usec\nrounds: 2719" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_nested_locked", + "value": 2934.087133392178, + "unit": "iter/sec", + "range": "stddev: 0.000004879296737467311", + "extra": "mean: 340.82150752076427 usec\nrounds: 2857" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_nested_leaf", + "value": 4998.668834723918, + "unit": "iter/sec", + "range": "stddev: 0.000003602880889331505", + "extra": "mean: 200.05326079082633 usec\nrounds: 4751" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_stack_nested", + "value": 665.9071182556547, + "unit": "iter/sec", + "range": "stddev: 0.00001702296824492105", + "extra": "mean: 1.5017109332297007 msec\nrounds: 554" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_stack_nested_leaf", + "value": 766.9821966442124, + "unit": "iter/sec", + "range": "stddev: 0.000013762285190132884", + "extra": "mean: 1.303811228442216 msec\nrounds: 731" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_stack_nested_locked", + "value": 1191.778762723208, + "unit": "iter/sec", + "range": "stddev: 0.0000339391396389079", + "extra": "mean: 839.0819095609704 usec\nrounds: 1161" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys", + "value": 220182.529764498, + "unit": "iter/sec", + "range": "stddev: 2.9309597753251687e-7", + "extra": "mean: 4.541686395689868 usec\nrounds: 112234" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_nested", + "value": 10965.990328590986, + "unit": "iter/sec", + "range": "stddev: 0.000006827411279608089", + "extra": "mean: 91.19103428285528 usec\nrounds: 8283" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_nested_locked", + "value": 11056.636484180763, + "unit": "iter/sec", + "range": "stddev: 0.000001790937866480385", + "extra": "mean: 90.44341843296972 usec\nrounds: 10446" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_nested_leaf", + "value": 12030.245999798864, + "unit": "iter/sec", + "range": "stddev: 0.000002989102978668293", + "extra": "mean: 83.12381974705414 usec\nrounds: 10657" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_stack_nested", + "value": 780.0673449485245, + "unit": "iter/sec", + "range": "stddev: 0.000012955202434037268", + "extra": "mean: 1.2819405997132063 msec\nrounds: 712" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_stack_nested_leaf", + "value": 784.9197359807504, + "unit": "iter/sec", + "range": "stddev: 0.000012455192694473352", + "extra": "mean: 1.2740156147946882 msec\nrounds: 784" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_stack_nested_locked", + "value": 1579.763358408855, + "unit": "iter/sec", + "range": "stddev: 0.000008394436343125187", + "extra": "mean: 633.0061997432352 usec\nrounds: 1542" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values", + "value": 526328.7303306749, + "unit": "iter/sec", + "range": "stddev: 1.0225137489774525e-7", + "extra": "mean: 1.899953284654721 usec\nrounds: 163399" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_nested", + "value": 23003.268106957632, + "unit": "iter/sec", + "range": "stddev: 0.0000012643219428011006", + "extra": "mean: 43.472083851317514 usec\nrounds: 16565" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_nested_locked", + "value": 21709.427965390256, + "unit": "iter/sec", + "range": "stddev: 0.0000012258694804562209", + "extra": "mean: 46.06293641611499 usec\nrounds: 19897" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_nested_leaf", + "value": 26428.57480857615, + "unit": "iter/sec", + "range": "stddev: 0.0000010491878516070282", + "extra": "mean: 37.83783299867903 usec\nrounds: 21515" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_stack_nested", + "value": 876.0480923640239, + "unit": "iter/sec", + "range": "stddev: 0.000014542366585560243", + "extra": "mean: 1.141489843669987 msec\nrounds: 774" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_stack_nested_leaf", + "value": 898.6766550400838, + "unit": "iter/sec", + "range": "stddev: 0.000012461867439000051", + "extra": "mean: 1.112747276110557 msec\nrounds: 862" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_stack_nested_locked", + "value": 1945.0853805392665, + "unit": "iter/sec", + "range": "stddev: 0.000008146621423471252", + "extra": "mean: 514.1162490886412 usec\nrounds: 1879" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership", + "value": 1046204.4741050876, + "unit": "iter/sec", + "range": "stddev: 6.193399386687573e-8", + "extra": "mean: 955.8360958598505 nsec\nrounds: 167505" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested", + "value": 470098.7874043673, + "unit": "iter/sec", + "range": "stddev: 1.5568256220078236e-7", + "extra": "mean: 2.127212464259826 usec\nrounds: 183151" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested_leaf", + "value": 472761.55528470885, + "unit": "iter/sec", + "range": "stddev: 1.562783886154556e-7", + "extra": "mean: 2.115231217136036 usec\nrounds: 187970" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested", + "value": 91924.35667891623, + "unit": "iter/sec", + "range": "stddev: 5.620981608809637e-7", + "extra": "mean: 10.878509636928033 usec\nrounds: 32227" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested_leaf", + "value": 91919.58458390833, + "unit": "iter/sec", + "range": "stddev: 5.693296258951259e-7", + "extra": "mean: 10.879074405380443 usec\nrounds: 57307" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested_last", + "value": 216679.65116118285, + "unit": "iter/sec", + "range": "stddev: 3.449176564555595e-7", + "extra": "mean: 4.6151080391768025 usec\nrounds: 110988" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested_leaf_last", + "value": 215450.7224080803, + "unit": "iter/sec", + "range": "stddev: 3.523050665784156e-7", + "extra": "mean: 4.64143256900259 usec\nrounds: 125157" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested_last", + "value": 7351.411971078304, + "unit": "iter/sec", + "range": "stddev: 0.000002580802677873314", + "extra": "mean: 136.0282900664755 usec\nrounds: 6409" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested_leaf_last", + "value": 78521.44819779783, + "unit": "iter/sec", + "range": "stddev: 6.63450942357982e-7", + "extra": "mean: 12.735373874931225 usec\nrounds: 46211" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_getleaf", + "value": 114507.65363096276, + "unit": "iter/sec", + "range": "stddev: 4.2161124794152524e-7", + "extra": "mean: 8.733040703312437 usec\nrounds: 90901" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_get", + "value": 121162.68696254937, + "unit": "iter/sec", + "range": "stddev: 3.996583971222008e-7", + "extra": "mean: 8.253365991372357 usec\nrounds: 97838" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_getleaf", + "value": 1781.6525583629432, + "unit": "iter/sec", + "range": "stddev: 0.000008458911967920671", + "extra": "mean: 561.2766615500173 usec\nrounds: 1625" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_get", + "value": 1896.5114946441777, + "unit": "iter/sec", + "range": "stddev: 0.0000066914447584017324", + "extra": "mean: 527.28391197419 usec\nrounds: 1829" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_getitemleaf", + "value": 113709.38067630203, + "unit": "iter/sec", + "range": "stddev: 4.258963343894486e-7", + "extra": "mean: 8.794349191353993 usec\nrounds: 77640" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_getitem", + "value": 120675.75764225211, + "unit": "iter/sec", + "range": "stddev: 4.089769844372721e-7", + "extra": "mean: 8.286668503582453 usec\nrounds: 92851" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_getitemleaf", + "value": 1770.2308052488156, + "unit": "iter/sec", + "range": "stddev: 0.000007674778719425051", + "extra": "mean: 564.8980895795928 usec\nrounds: 1652" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_getitem", + "value": 1875.8739001224174, + "unit": "iter/sec", + "range": "stddev: 0.000007209716452163084", + "extra": "mean: 533.0848731008738 usec\nrounds: 1836" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_lock_nested", + "value": 1783.7922558705682, + "unit": "iter/sec", + "range": "stddev: 0.0003922099013848021", + "extra": "mean: 560.6033980184293 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_lock_stack_nested", + "value": 135.7920353822932, + "unit": "iter/sec", + "range": "stddev: 0.013238064644635842", + "extra": "mean: 7.364202157988984 msec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unlock_nested", + "value": 2331.080897706877, + "unit": "iter/sec", + "range": "stddev: 0.00011076280135199418", + "extra": "mean: 428.9855409924712 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unlock_stack_nested", + "value": 161.44881724957727, + "unit": "iter/sec", + "range": "stddev: 0.00990872284233495", + "extra": "mean: 6.193913445981707 msec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_flatten_speed", + "value": 5295.2091845438335, + "unit": "iter/sec", + "range": "stddev: 0.000010983198674549136", + "extra": "mean: 188.84995193747895 usec\nrounds: 4369" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unflatten_speed", + "value": 2702.5882845767424, + "unit": "iter/sec", + "range": "stddev: 0.00000677313274476646", + "extra": "mean: 370.0156645045962 usec\nrounds: 2632" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_common_ops", + "value": 1614.8120547096003, + "unit": "iter/sec", + "range": "stddev: 0.00007096828627130187", + "extra": "mean: 619.2671135216631 usec\nrounds: 1101" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation", + "value": 474204.902596119, + "unit": "iter/sec", + "range": "stddev: 2.7751594528559015e-7", + "extra": "mean: 2.1087930439464513 usec\nrounds: 116145" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation_empty", + "value": 150196.6847170591, + "unit": "iter/sec", + "range": "stddev: 5.566466623420341e-7", + "extra": "mean: 6.657936570862416 usec\nrounds: 43403" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation_nested_1", + "value": 111180.2141749059, + "unit": "iter/sec", + "range": "stddev: 6.148005208136925e-7", + "extra": "mean: 8.994406130814115 usec\nrounds: 42053" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation_nested_2", + "value": 85662.77871003316, + "unit": "iter/sec", + "range": "stddev: 7.323211702737149e-7", + "extra": "mean: 11.67368155759902 usec\nrounds: 35702" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_clone", + "value": 67423.8008657284, + "unit": "iter/sec", + "range": "stddev: 0.0000011454361007558216", + "extra": "mean: 14.831557805402532 usec\nrounds: 18478" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[int]", + "value": 81942.35423965906, + "unit": "iter/sec", + "range": "stddev: 7.800431727439642e-7", + "extra": "mean: 12.203701117437662 usec\nrounds: 18034" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[slice_int]", + "value": 42259.316757646695, + "unit": "iter/sec", + "range": "stddev: 0.0000015096199375384041", + "extra": "mean: 23.663420914609393 usec\nrounds: 14029" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[range]", + "value": 22818.41751906278, + "unit": "iter/sec", + "range": "stddev: 0.0000028403480550592344", + "extra": "mean: 43.824248511737856 usec\nrounds: 6209" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[tuple]", + "value": 49492.20997692378, + "unit": "iter/sec", + "range": "stddev: 0.0000013053023954507273", + "extra": "mean: 20.20519997927471 usec\nrounds: 22563" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[list]", + "value": 25179.544671505744, + "unit": "iter/sec", + "range": "stddev: 0.0000035864612414432614", + "extra": "mean: 39.71477693683806 usec\nrounds: 13476" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[int]", + "value": 37643.795057156996, + "unit": "iter/sec", + "range": "stddev: 0.0000015629851500853591", + "extra": "mean: 26.56480300356634 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[slice_int]", + "value": 21159.444464022137, + "unit": "iter/sec", + "range": "stddev: 0.0000022413026944654584", + "extra": "mean: 47.26021997885255 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[range]", + "value": 15267.880460186892, + "unit": "iter/sec", + "range": "stddev: 0.000002800735261967266", + "extra": "mean: 65.49697599530191 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[tuple]", + "value": 24964.68058413134, + "unit": "iter/sec", + "range": "stddev: 0.000002298162137029405", + "extra": "mean: 40.05659101585479 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem", + "value": 52938.55870014419, + "unit": "iter/sec", + "range": "stddev: 0.000001872767187712049", + "extra": "mean: 18.88982292971411 usec\nrounds: 23725" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set", + "value": 54833.26757263804, + "unit": "iter/sec", + "range": "stddev: 0.0000018025735021858887", + "extra": "mean: 18.237103938321614 usec\nrounds: 25323" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set_shared", + "value": 8133.781525652262, + "unit": "iter/sec", + "range": "stddev: 0.0008329197394793035", + "extra": "mean: 122.94404476518176 usec\nrounds: 5138" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_update", + "value": 49270.76586300575, + "unit": "iter/sec", + "range": "stddev: 0.000002089146667771516", + "extra": "mean: 20.296010879563692 usec\nrounds: 29146" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_update_nested", + "value": 36886.52962706479, + "unit": "iter/sec", + "range": "stddev: 0.0000021911318519974818", + "extra": "mean: 27.110167589912525 usec\nrounds: 25031" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set_nested", + "value": 49639.70551439531, + "unit": "iter/sec", + "range": "stddev: 0.0000019348292901182045", + "extra": "mean: 20.145163828782266 usec\nrounds: 22066" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set_nested_new", + "value": 40692.34474768933, + "unit": "iter/sec", + "range": "stddev: 0.000002020856986014747", + "extra": "mean: 24.574646808888645 usec\nrounds: 20496" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_select", + "value": 20645.730579953284, + "unit": "iter/sec", + "range": "stddev: 0.0000028330851530678264", + "extra": "mean: 48.43616437439061 usec\nrounds: 10689" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_to", + "value": 17213.70382835163, + "unit": "iter/sec", + "range": "stddev: 0.000009603443546007224", + "extra": "mean: 58.09325000427634 usec\nrounds: 8" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_to_nonblocking", + "value": 26732.84735545586, + "unit": "iter/sec", + "range": "stddev: 0.0000023564487686487704", + "extra": "mean: 37.407163805015024 usec\nrounds: 13174" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unbind_speed", + "value": 2818.212020715407, + "unit": "iter/sec", + "range": "stddev: 0.00000878141348267916", + "extra": "mean: 354.83490690176984 usec\nrounds: 2320" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unbind_speed_stack0", + "value": 246.67415404707108, + "unit": "iter/sec", + "range": "stddev: 0.0036339130914563407", + "extra": "mean: 4.053931000039741 msec\nrounds: 212" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unbind_speed_stack1", + "value": 1866970.5218485354, + "unit": "iter/sec", + "range": "stddev: 2.4023951323020675e-8", + "extra": "mean: 535.6270965704001 nsec\nrounds: 87720" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_split", + "value": 564.7275415772132, + "unit": "iter/sec", + "range": "stddev: 0.0023482132715134415", + "extra": "mean: 1.7707654158448256 msec\nrounds: 493" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_chunk", + "value": 572.2257996724624, + "unit": "iter/sec", + "range": "stddev: 0.0021482954828925377", + "extra": "mean: 1.74756189003081 msec\nrounds: 582" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_creation[device0]", + "value": 3238.649139040747, + "unit": "iter/sec", + "range": "stddev: 0.000011890066892945103", + "extra": "mean: 308.7707118209752 usec\nrounds: 1742" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_creation[device1]", + "value": 3190.8833954304073, + "unit": "iter/sec", + "range": "stddev: 0.000012849441363578408", + "extra": "mean: 313.39283705323663 usec\nrounds: 2295" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_creation_from_tensor", + "value": 2908.867949596628, + "unit": "iter/sec", + "range": "stddev: 0.000012469126250964614", + "extra": "mean: 343.77634781897535 usec\nrounds: 1564" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_add_one[memmap_tensor0]", + "value": 37772.294789715634, + "unit": "iter/sec", + "range": "stddev: 0.0000021252211873605623", + "extra": "mean: 26.47443067907732 usec\nrounds: 5972" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_add_one[memmap_tensor1]", + "value": 13288.148714001518, + "unit": "iter/sec", + "range": "stddev: 0.000015690559576695738", + "extra": "mean: 75.255027733571 usec\nrounds: 72" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_contiguous[memmap_tensor0]", + "value": 165509.97459968348, + "unit": "iter/sec", + "range": "stddev: 5.26559094963424e-7", + "extra": "mean: 6.041931928384892 usec\nrounds: 46553" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_contiguous[memmap_tensor1]", + "value": 43219.36314504978, + "unit": "iter/sec", + "range": "stddev: 0.000001596012333557861", + "extra": "mean: 23.13777731161541 usec\nrounds: 17886" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_stack[memmap_tensor0]", + "value": 46603.52402725342, + "unit": "iter/sec", + "range": "stddev: 0.0000015302708518777697", + "extra": "mean: 21.457604781458308 usec\nrounds: 13795" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_stack[memmap_tensor1]", + "value": 12622.478996690405, + "unit": "iter/sec", + "range": "stddev: 0.000008704778034663363", + "extra": "mean: 79.22374046034844 usec\nrounds: 131" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_memmaptd_index", + "value": 4101.310985292997, + "unit": "iter/sec", + "range": "stddev: 0.000005566959866894971", + "extra": "mean: 243.8244755362193 usec\nrounds: 2166" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_memmaptd_index_astensor", + "value": 3330.118028150274, + "unit": "iter/sec", + "range": "stddev: 0.000007695692942900346", + "extra": "mean: 300.28965686704316 usec\nrounds: 2926" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_memmaptd_index_op", + "value": 1729.8275370260585, + "unit": "iter/sec", + "range": "stddev: 0.000015204156079429455", + "extra": "mean: 578.0923118608764 usec\nrounds: 1552" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_reshape_pytree", + "value": 47386.030293707736, + "unit": "iter/sec", + "range": "stddev: 0.0000011251243691577144", + "extra": "mean: 21.10326595838072 usec\nrounds: 12611" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_reshape_td", + "value": 32885.54499703288, + "unit": "iter/sec", + "range": "stddev: 0.0000016963817264867057", + "extra": "mean: 30.40849710990728 usec\nrounds: 10197" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_view_pytree", + "value": 48166.37145749196, + "unit": "iter/sec", + "range": "stddev: 0.0000010715290771129283", + "extra": "mean: 20.761372919330768 usec\nrounds: 22702" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_view_td", + "value": 244665.49489308023, + "unit": "iter/sec", + "range": "stddev: 3.5609128045840565e-7", + "extra": "mean: 4.087213035238189 usec\nrounds: 36482" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_unbind_pytree", + "value": 38689.13422495437, + "unit": "iter/sec", + "range": "stddev: 0.00000120356904822742", + "extra": "mean: 25.847050341979564 usec\nrounds: 19728" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_unbind_td", + "value": 17618.13927731671, + "unit": "iter/sec", + "range": "stddev: 0.0000021200094044975347", + "extra": "mean: 56.75968297557373 usec\nrounds: 11324" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_split_pytree", + "value": 40392.64112814329, + "unit": "iter/sec", + "range": "stddev: 0.0000014551203184711374", + "extra": "mean: 24.756984739560817 usec\nrounds: 11729" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_split_td", + "value": 22597.494321764334, + "unit": "iter/sec", + "range": "stddev: 0.0000019925349509302424", + "extra": "mean: 44.252693938587235 usec\nrounds: 12759" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_add_pytree", + "value": 30876.870904687785, + "unit": "iter/sec", + "range": "stddev: 0.0000016246780061106978", + "extra": "mean: 32.386701459705826 usec\nrounds: 14035" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_add_td", + "value": 21569.119549138908, + "unit": "iter/sec", + "range": "stddev: 0.0000023674003797054753", + "extra": "mean: 46.36257858007572 usec\nrounds: 12752" + }, + { + "name": "benchmarks/distributed/distributed_benchmark_test.py::test_distributed", + "value": 180166.22198193162, + "unit": "iter/sec", + "range": "stddev: 4.277729852547084e-7", + "extra": "mean: 5.550429980711297 usec\nrounds: 17059" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdmodule", + "value": 59063.26372127283, + "unit": "iter/sec", + "range": "stddev: 0.0000011904045272164437", + "extra": "mean: 16.930998001043918 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdmodule_dispatch", + "value": 30129.873008857834, + "unit": "iter/sec", + "range": "stddev: 0.000014317946807037491", + "extra": "mean: 33.18965200105595 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdseq", + "value": 50111.32729024038, + "unit": "iter/sec", + "range": "stddev: 0.0000015358404021485793", + "extra": "mean: 19.95556801375642 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdseq_dispatch", + "value": 27468.643367518434, + "unit": "iter/sec", + "range": "stddev: 0.000001617540808764401", + "extra": "mean: 36.40514701146458 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_instantiation_functorch", + "value": 584.7157844788383, + "unit": "iter/sec", + "range": "stddev: 0.000022966180816875067", + "extra": "mean: 1.7102326062418645 msec\nrounds: 480" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_instantiation_td", + "value": 842.268798533005, + "unit": "iter/sec", + "range": "stddev: 0.00010546583237700415", + "extra": "mean: 1.1872694343441408 msec\nrounds: 815" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_functorch", + "value": 6113.046396422752, + "unit": "iter/sec", + "range": "stddev: 0.000004038785319524301", + "extra": "mean: 163.58455917906699 usec\nrounds: 3017" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_functional_call", + "value": 6166.648810933122, + "unit": "iter/sec", + "range": "stddev: 0.000004698710488230567", + "extra": "mean: 162.16263170801233 usec\nrounds: 4157" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_td", + "value": 6560.555956938824, + "unit": "iter/sec", + "range": "stddev: 0.000004675098017569727", + "extra": "mean: 152.42610634885938 usec\nrounds: 2614" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_td_decorator", + "value": 5311.47393567739, + "unit": "iter/sec", + "range": "stddev: 0.00005539804589457992", + "extra": "mean: 188.27165719160524 usec\nrounds: 3976" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed[True-True]", + "value": 925.7621705754688, + "unit": "iter/sec", + "range": "stddev: 0.00001754049484184369", + "extra": "mean: 1.0801910380269522 msec\nrounds: 815" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed[True-False]", + "value": 1622.9839852087246, + "unit": "iter/sec", + "range": "stddev: 0.000009539137389666402", + "extra": "mean: 616.1490249525749 usec\nrounds: 1523" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed[False-True]", + "value": 1014.2985224409654, + "unit": "iter/sec", + "range": "stddev: 0.000012674861398712025", + "extra": "mean: 985.9030432120169 usec\nrounds: 995" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed[False-False]", + "value": 1820.9463704938614, + "unit": "iter/sec", + "range": "stddev: 0.000008320278384715101", + "extra": "mean: 549.1649925575724 usec\nrounds: 1750" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[True-True]", + "value": 489.75757734264647, + "unit": "iter/sec", + "range": "stddev: 0.00007602282595191556", + "extra": "mean: 2.04182650001222 msec\nrounds: 486" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[True-False]", + "value": 1515.5282630232641, + "unit": "iter/sec", + "range": "stddev: 0.000044647746894331554", + "extra": "mean: 659.8359294238048 usec\nrounds: 1516" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[False-True]", + "value": 564.553476375117, + "unit": "iter/sec", + "range": "stddev: 0.00006275568956451099", + "extra": "mean: 1.7713113847439155 msec\nrounds: 564" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[False-False]", + "value": 1774.076307856702, + "unit": "iter/sec", + "range": "stddev: 0.000041208229440625735", + "extra": "mean: 563.6736117670838 usec\nrounds: 1785" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed[True-True]", + "value": 79.20092296097073, + "unit": "iter/sec", + "range": "stddev: 0.00006198565382266198", + "extra": "mean: 12.626115487224663 msec\nrounds: 78" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed[True-False]", + "value": 120.39712642997077, + "unit": "iter/sec", + "range": "stddev: 0.000027931500062427106", + "extra": "mean: 8.305846075002895 msec\nrounds: 120" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed[False-True]", + "value": 79.60047867036927, + "unit": "iter/sec", + "range": "stddev: 0.00005478238955613421", + "extra": "mean: 12.562738524991346 msec\nrounds: 80" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed[False-False]", + "value": 121.42876786903199, + "unit": "iter/sec", + "range": "stddev: 0.000021953673720273924", + "extra": "mean: 8.235280795062982 msec\nrounds: 122" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed_decorator[True-True]", + "value": 15.361842133081707, + "unit": "iter/sec", + "range": "stddev: 0.00038290764560047183", + "extra": "mean: 65.09635962515858 msec\nrounds: 8" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed_decorator[True-False]", + "value": 49.58132891218457, + "unit": "iter/sec", + "range": "stddev: 0.0005074893599124567", + "extra": "mean: 20.168882560028578 msec\nrounds: 50" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed_decorator[False-True]", + "value": 16.96896852485491, + "unit": "iter/sec", + "range": "stddev: 0.00038926449700210376", + "extra": "mean: 58.93110111762379 msec\nrounds: 17" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed_decorator[False-False]", + "value": 46.63893053915683, + "unit": "iter/sec", + "range": "stddev: 0.011999933710217207", + "extra": "mean: 21.441314979562534 msec\nrounds: 49" + } + ] } ] }