diff --git a/dev/bench/data.js b/dev/bench/data.js index 1db5a473d..95b39dfc5 100644 --- a/dev/bench/data.js +++ b/dev/bench/data.js @@ -1,5 +1,5 @@ window.BENCHMARK_DATA = { - "lastUpdate": 1700563223654, + "lastUpdate": 1700564383858, "repoUrl": "https://github.com/pytorch/tensordict", "entries": { "CPU Benchmark Results": [ @@ -138078,6 +138078,779 @@ window.BENCHMARK_DATA = { "extra": "mean: 376.53617194451954 usec\nrounds: 2495" } ] + }, + { + "commit": { + "author": { + "email": "vmoens@meta.com", + "name": "Vincent Moens", + "username": "vmoens" + }, + "committer": { + "email": "noreply@github.com", + "name": "GitHub", + "username": "web-flow" + }, + "distinct": true, + "id": "3689afaab850b3dd175449c5bac5f2ea8f880d24", + "message": "[Performance] Faster split, chunk and unbind (#563)", + "timestamp": "2023-11-21T10:55:39Z", + "tree_id": "75075b1ef7e24ec97f15576aa73ded1f8d30f3e9", + "url": "https://github.com/pytorch/tensordict/commit/3689afaab850b3dd175449c5bac5f2ea8f880d24" + }, + "date": 1700564379416, + "tool": "pytest", + "benches": [ + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_nested", + "value": 61617.40998992074, + "unit": "iter/sec", + "range": "stddev: 9.209384807739045e-7", + "extra": "mean: 16.229179385559668 usec\nrounds: 3774" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_stack_nested", + "value": 6840.9142124872415, + "unit": "iter/sec", + "range": "stddev: 0.000004360109231908391", + "extra": "mean: 146.1792925534169 usec\nrounds: 1504" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_nested_inplace", + "value": 52466.97053186901, + "unit": "iter/sec", + "range": "stddev: 0.0000010278399524044853", + "extra": "mean: 19.05961007206599 usec\nrounds: 13205" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_stack_nested_inplace", + "value": 5743.843704491087, + "unit": "iter/sec", + "range": "stddev: 0.000015293902350011525", + "extra": "mean: 174.099444805245 usec\nrounds: 4928" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items", + "value": 408424.80290379975, + "unit": "iter/sec", + "range": "stddev: 1.8591575437083456e-7", + "extra": "mean: 2.4484311258529017 usec\nrounds: 107435" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_nested", + "value": 3739.785188569936, + "unit": "iter/sec", + "range": "stddev: 0.00001031112002902211", + "extra": "mean: 267.3950373022339 usec\nrounds: 3351" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_nested_locked", + "value": 3735.405319421855, + "unit": "iter/sec", + "range": "stddev: 0.000004682859261550644", + "extra": "mean: 267.70856560079386 usec\nrounds: 3628" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_nested_leaf", + "value": 6064.548349083536, + "unit": "iter/sec", + "range": "stddev: 0.000010413582696394516", + "extra": "mean: 164.89274096579976 usec\nrounds: 5424" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_stack_nested", + "value": 692.2011774452451, + "unit": "iter/sec", + "range": "stddev: 0.000021237609484040297", + "extra": "mean: 1.4446667133545905 msec\nrounds: 614" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_stack_nested_leaf", + "value": 755.0836219474934, + "unit": "iter/sec", + "range": "stddev: 0.000020299002976245728", + "extra": "mean: 1.3243566287675852 msec\nrounds: 730" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_stack_nested_locked", + "value": 1294.3749544448572, + "unit": "iter/sec", + "range": "stddev: 0.00003372071760304257", + "extra": "mean: 772.5736631151741 usec\nrounds: 1220" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys", + "value": 258142.60603450806, + "unit": "iter/sec", + "range": "stddev: 2.3006945764634933e-7", + "extra": "mean: 3.87382778597316 usec\nrounds: 85237" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_nested", + "value": 6794.014903385893, + "unit": "iter/sec", + "range": "stddev: 0.000580899125860603", + "extra": "mean: 147.18837303427696 usec\nrounds: 5659" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_nested_locked", + "value": 7133.13784367394, + "unit": "iter/sec", + "range": "stddev: 0.00000619362486607265", + "extra": "mean: 140.19075782852778 usec\nrounds: 6834" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_nested_leaf", + "value": 7234.75260064688, + "unit": "iter/sec", + "range": "stddev: 0.000004265008827808462", + "extra": "mean: 138.2217271549254 usec\nrounds: 3086" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_stack_nested", + "value": 728.2321331278434, + "unit": "iter/sec", + "range": "stddev: 0.000059863544645297", + "extra": "mean: 1.373188512988134 msec\nrounds: 616" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_stack_nested_leaf", + "value": 726.1031542051477, + "unit": "iter/sec", + "range": "stddev: 0.00005516883105889427", + "extra": "mean: 1.3772147858174262 msec\nrounds: 691" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_stack_nested_locked", + "value": 1489.3675631027334, + "unit": "iter/sec", + "range": "stddev: 0.000013769002922932278", + "extra": "mean: 671.4259292157165 usec\nrounds: 1441" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values", + "value": 878208.3277522952, + "unit": "iter/sec", + "range": "stddev: 1.0362255179609059e-7", + "extra": "mean: 1.138681982849593 usec\nrounds: 168606" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_nested", + "value": 20535.737549161808, + "unit": "iter/sec", + "range": "stddev: 0.0000016149060345774404", + "extra": "mean: 48.6955970101408 usec\nrounds: 15519" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_nested_locked", + "value": 20576.209410529853, + "unit": "iter/sec", + "range": "stddev: 0.0000020211825581394037", + "extra": "mean: 48.59981642139835 usec\nrounds: 18488" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_nested_leaf", + "value": 22759.851099534386, + "unit": "iter/sec", + "range": "stddev: 0.0000025729549070426115", + "extra": "mean: 43.93701855195607 usec\nrounds: 539" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_stack_nested", + "value": 854.1390434530979, + "unit": "iter/sec", + "range": "stddev: 0.00002861245023186097", + "extra": "mean: 1.17076956926968 msec\nrounds: 794" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_stack_nested_leaf", + "value": 859.9977888454722, + "unit": "iter/sec", + "range": "stddev: 0.00004944127483849031", + "extra": "mean: 1.1627936873447984 msec\nrounds: 806" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_stack_nested_locked", + "value": 1949.2200640057608, + "unit": "iter/sec", + "range": "stddev: 0.000011663149422881754", + "extra": "mean: 513.025706263736 usec\nrounds: 1852" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership", + "value": 756803.4972312617, + "unit": "iter/sec", + "range": "stddev: 1.415186000349463e-7", + "extra": "mean: 1.3213469594927403 usec\nrounds: 96628" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested", + "value": 362186.6938501415, + "unit": "iter/sec", + "range": "stddev: 2.9460406505863097e-7", + "extra": "mean: 2.761007008208204 usec\nrounds: 161239" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested_leaf", + "value": 356178.37507792655, + "unit": "iter/sec", + "range": "stddev: 2.5422401445081763e-7", + "extra": "mean: 2.807582014998004 usec\nrounds: 136725" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested", + "value": 88005.6667734549, + "unit": "iter/sec", + "range": "stddev: 0.000001105659631146529", + "extra": "mean: 11.36290464765423 usec\nrounds: 35395" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested_leaf", + "value": 86934.10374994042, + "unit": "iter/sec", + "range": "stddev: 6.566258294607602e-7", + "extra": "mean: 11.50296554360791 usec\nrounds: 32737" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested_last", + "value": 169618.1293580388, + "unit": "iter/sec", + "range": "stddev: 5.197355425944612e-7", + "extra": "mean: 5.895596206518395 usec\nrounds: 86200" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested_leaf_last", + "value": 156154.39304512684, + "unit": "iter/sec", + "range": "stddev: 0.000003356894604252797", + "extra": "mean: 6.403918458515679 usec\nrounds: 27998" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested_last", + "value": 6036.675047679644, + "unit": "iter/sec", + "range": "stddev: 0.000009804999295490123", + "extra": "mean: 165.65410463569287 usec\nrounds: 5199" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested_leaf_last", + "value": 74067.77615121416, + "unit": "iter/sec", + "range": "stddev: 7.43798578227596e-7", + "extra": "mean: 13.50114789403742 usec\nrounds: 24646" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_getleaf", + "value": 95481.7039453431, + "unit": "iter/sec", + "range": "stddev: 4.84769371632633e-7", + "extra": "mean: 10.473210664238177 usec\nrounds: 71398" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_get", + "value": 100533.0519023396, + "unit": "iter/sec", + "range": "stddev: 6.844520862721521e-7", + "extra": "mean: 9.946977447490859 usec\nrounds: 73606" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_getleaf", + "value": 1616.3843770477326, + "unit": "iter/sec", + "range": "stddev: 0.000012467110214476608", + "extra": "mean: 618.6647274000901 usec\nrounds: 1427" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_get", + "value": 1696.0252619033242, + "unit": "iter/sec", + "range": "stddev: 0.00002661636378641538", + "extra": "mean: 589.6138592167982 usec\nrounds: 1584" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_getitemleaf", + "value": 94279.77966954361, + "unit": "iter/sec", + "range": "stddev: 9.49364840363644e-7", + "extra": "mean: 10.606728224281612 usec\nrounds: 63821" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_getitem", + "value": 100130.6632366452, + "unit": "iter/sec", + "range": "stddev: 5.15138508565642e-7", + "extra": "mean: 9.986950726938021 usec\nrounds: 74767" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_getitemleaf", + "value": 1621.7127249853627, + "unit": "iter/sec", + "range": "stddev: 0.000029966090173731818", + "extra": "mean: 616.6320240281927 usec\nrounds: 1415" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_getitem", + "value": 1705.3921225432969, + "unit": "iter/sec", + "range": "stddev: 0.000011020496942788785", + "extra": "mean: 586.3754070287796 usec\nrounds: 1565" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_lock_nested", + "value": 2035.5863775376254, + "unit": "iter/sec", + "range": "stddev: 0.00019528252758542095", + "extra": "mean: 491.25893699959994 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_lock_stack_nested", + "value": 121.30358415869281, + "unit": "iter/sec", + "range": "stddev: 0.015246090448835372", + "extra": "mean: 8.243779496999622 msec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unlock_nested", + "value": 1975.0038808368436, + "unit": "iter/sec", + "range": "stddev: 0.0019516000853643555", + "extra": "mean: 506.3281189990789 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unlock_stack_nested", + "value": 205.21366994966738, + "unit": "iter/sec", + "range": "stddev: 0.00046767095067153905", + "extra": "mean: 4.872969720999919 msec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_flatten_speed", + "value": 3718.0732185667166, + "unit": "iter/sec", + "range": "stddev: 0.00001339563117706748", + "extra": "mean: 268.95651086330435 usec\nrounds: 3314" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unflatten_speed", + "value": 2109.4176545575533, + "unit": "iter/sec", + "range": "stddev: 0.00000789951222035136", + "extra": "mean: 474.0644878170171 usec\nrounds: 2011" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_common_ops", + "value": 1390.5619003609324, + "unit": "iter/sec", + "range": "stddev: 0.00015170716065069452", + "extra": "mean: 719.133754304962 usec\nrounds: 871" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation", + "value": 406237.2170772195, + "unit": "iter/sec", + "range": "stddev: 6.40089119674693e-7", + "extra": "mean: 2.4616159178983232 usec\nrounds: 98242" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation_empty", + "value": 109573.92762413014, + "unit": "iter/sec", + "range": "stddev: 5.925729396146033e-7", + "extra": "mean: 9.126258606246967 usec\nrounds: 21554" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation_nested_1", + "value": 78036.59984006025, + "unit": "iter/sec", + "range": "stddev: 8.778372461907372e-7", + "extra": "mean: 12.814499889148784 usec\nrounds: 22537" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation_nested_2", + "value": 62738.772922648335, + "unit": "iter/sec", + "range": "stddev: 9.125807579183556e-7", + "extra": "mean: 15.939106766288154 usec\nrounds: 20765" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_clone", + "value": 76231.28057303852, + "unit": "iter/sec", + "range": "stddev: 0.0000015842209972962496", + "extra": "mean: 13.117974570057008 usec\nrounds: 14825" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[int]", + "value": 76690.22443506791, + "unit": "iter/sec", + "range": "stddev: 0.0000016796683990939358", + "extra": "mean: 13.039471554118089 usec\nrounds: 16382" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[slice_int]", + "value": 39905.84184052706, + "unit": "iter/sec", + "range": "stddev: 0.000004543337692621837", + "extra": "mean: 25.05898770401162 usec\nrounds: 12687" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[range]", + "value": 22113.38318032059, + "unit": "iter/sec", + "range": "stddev: 0.000004424363137830844", + "extra": "mean: 45.22148383382295 usec\nrounds: 5227" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[tuple]", + "value": 49136.09072694018, + "unit": "iter/sec", + "range": "stddev: 0.000001373729698943646", + "extra": "mean: 20.35163939999246 usec\nrounds: 15599" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[list]", + "value": 24470.886120616797, + "unit": "iter/sec", + "range": "stddev: 0.0000048820492835882485", + "extra": "mean: 40.864887159010436 usec\nrounds: 8029" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[int]", + "value": 34578.02106856719, + "unit": "iter/sec", + "range": "stddev: 0.0000025262260849529847", + "extra": "mean: 28.92010500013953 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[slice_int]", + "value": 18876.37900907297, + "unit": "iter/sec", + "range": "stddev: 0.0000029076440403017254", + "extra": "mean: 52.97626200021455 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[range]", + "value": 13412.460951399582, + "unit": "iter/sec", + "range": "stddev: 0.000005021369118937627", + "extra": "mean: 74.55753300035894 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[tuple]", + "value": 23226.22590202361, + "unit": "iter/sec", + "range": "stddev: 0.000003971354975618318", + "extra": "mean: 43.0547780004531 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem", + "value": 52903.57667867985, + "unit": "iter/sec", + "range": "stddev: 0.0000019187874735758146", + "extra": "mean: 18.902313657802274 usec\nrounds: 20296" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set", + "value": 54219.45326089553, + "unit": "iter/sec", + "range": "stddev: 0.0000018930265018414464", + "extra": "mean: 18.443564806678452 usec\nrounds: 20214" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set_shared", + "value": 7009.445934265767, + "unit": "iter/sec", + "range": "stddev: 0.00009454170324652787", + "extra": "mean: 142.66462847105888 usec\nrounds: 3709" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_update", + "value": 39747.40229594913, + "unit": "iter/sec", + "range": "stddev: 0.0000024061835218417112", + "extra": "mean: 25.158876863304233 usec\nrounds: 18784" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_update_nested", + "value": 27902.61565969159, + "unit": "iter/sec", + "range": "stddev: 0.0000029400186985105886", + "extra": "mean: 35.83893396218801 usec\nrounds: 16112" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set_nested", + "value": 49846.95625783337, + "unit": "iter/sec", + "range": "stddev: 0.0000024432436788473625", + "extra": "mean: 20.06140545126768 usec\nrounds: 18858" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set_nested_new", + "value": 37124.89004671234, + "unit": "iter/sec", + "range": "stddev: 0.0000033534537643337968", + "extra": "mean: 26.936106712821275 usec\nrounds: 15687" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_select", + "value": 19105.307369332586, + "unit": "iter/sec", + "range": "stddev: 0.0000032566421660930886", + "extra": "mean: 52.34147667287351 usec\nrounds: 9474" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unbind_speed", + "value": 2674.267514458477, + "unit": "iter/sec", + "range": "stddev: 0.000007632632185774206", + "extra": "mean: 373.9341687372267 usec\nrounds: 966" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unbind_speed_stack0", + "value": 180.37963696700962, + "unit": "iter/sec", + "range": "stddev: 0.009166360075664069", + "extra": "mean: 5.5438630258630255 msec\nrounds: 232" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unbind_speed_stack1", + "value": 1587663.771854149, + "unit": "iter/sec", + "range": "stddev: 2.634902329565814e-8", + "extra": "mean: 629.8562817441913 nsec\nrounds: 76197" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_split", + "value": 600.5816075378888, + "unit": "iter/sec", + "range": "stddev: 0.0000801136368906299", + "extra": "mean: 1.6650526547084 msec\nrounds: 446" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_chunk", + "value": 567.0316513651647, + "unit": "iter/sec", + "range": "stddev: 0.002461092114559696", + "extra": "mean: 1.7635699834258571 msec\nrounds: 543" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_creation[device0]", + "value": 3378.1314805936704, + "unit": "iter/sec", + "range": "stddev: 0.000016602441648610537", + "extra": "mean: 296.02163377733916 usec\nrounds: 1652" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_creation_from_tensor", + "value": 2983.6306176700923, + "unit": "iter/sec", + "range": "stddev: 0.00009751304038930751", + "extra": "mean: 335.1621323623823 usec\nrounds: 1511" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_add_one[memmap_tensor0]", + "value": 37446.83189931126, + "unit": "iter/sec", + "range": "stddev: 0.0000033523475703825942", + "extra": "mean: 26.70452877532725 usec\nrounds: 6377" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_contiguous[memmap_tensor0]", + "value": 169305.66591941737, + "unit": "iter/sec", + "range": "stddev: 6.9150896435527e-7", + "extra": "mean: 5.906476871695242 usec\nrounds: 39281" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_stack[memmap_tensor0]", + "value": 50064.29818917393, + "unit": "iter/sec", + "range": "stddev: 0.0000018366268424162014", + "extra": "mean: 19.97431375591006 usec\nrounds: 10948" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_memmaptd_index", + "value": 5121.676041500466, + "unit": "iter/sec", + "range": "stddev: 0.000011397550796489083", + "extra": "mean: 195.24858501340043 usec\nrounds: 3670" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_memmaptd_index_astensor", + "value": 3832.7484188967965, + "unit": "iter/sec", + "range": "stddev: 0.000008771518598788454", + "extra": "mean: 260.9093764332792 usec\nrounds: 3140" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_memmaptd_index_op", + "value": 1908.6168799093225, + "unit": "iter/sec", + "range": "stddev: 0.000016168790720179094", + "extra": "mean: 523.9396185406835 usec\nrounds: 658" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_reshape_pytree", + "value": 42129.74835950898, + "unit": "iter/sec", + "range": "stddev: 0.0000024650895345325163", + "extra": "mean: 23.73619684282527 usec\nrounds: 11720" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_reshape_td", + "value": 30854.952100094033, + "unit": "iter/sec", + "range": "stddev: 0.0000017597117708144726", + "extra": "mean: 32.409708391572984 usec\nrounds: 8556" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_view_pytree", + "value": 42451.30192904599, + "unit": "iter/sec", + "range": "stddev: 0.0000026391943606511366", + "extra": "mean: 23.55640356263799 usec\nrounds: 12687" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_view_td", + "value": 207563.79922065095, + "unit": "iter/sec", + "range": "stddev: 3.327301823013099e-7", + "extra": "mean: 4.8177957994348946 usec\nrounds: 31900" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_unbind_pytree", + "value": 37483.98191387788, + "unit": "iter/sec", + "range": "stddev: 0.0000018187706949657246", + "extra": "mean: 26.678062173265676 usec\nrounds: 11098" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_unbind_td", + "value": 16866.300650801222, + "unit": "iter/sec", + "range": "stddev: 0.0000023320630777038796", + "extra": "mean: 59.289824170927226 usec\nrounds: 8986" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_split_pytree", + "value": 37076.639008170925, + "unit": "iter/sec", + "range": "stddev: 0.0000024152730092105277", + "extra": "mean: 26.97116099923784 usec\nrounds: 8646" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_split_td", + "value": 21379.782814386217, + "unit": "iter/sec", + "range": "stddev: 0.000004041782895914077", + "extra": "mean: 46.77315989043215 usec\nrounds: 9125" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_add_pytree", + "value": 30629.69093721162, + "unit": "iter/sec", + "range": "stddev: 0.000002271898807328854", + "extra": "mean: 32.64806040811573 usec\nrounds: 8724" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_add_td", + "value": 20496.725538038576, + "unit": "iter/sec", + "range": "stddev: 0.000003310274079631964", + "extra": "mean: 48.788280749730646 usec\nrounds: 9122" + }, + { + "name": "benchmarks/distributed/distributed_benchmark_test.py::test_distributed", + "value": 168795.95068067123, + "unit": "iter/sec", + "range": "stddev: 4.1911872409129034e-7", + "extra": "mean: 5.92431273361411 usec\nrounds: 18738" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdmodule", + "value": 42744.33871517069, + "unit": "iter/sec", + "range": "stddev: 0.000026652014362926245", + "extra": "mean: 23.394911000110596 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdmodule_dispatch", + "value": 24527.37766770992, + "unit": "iter/sec", + "range": "stddev: 0.000014343145543724592", + "extra": "mean: 40.770766999543184 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdseq", + "value": 40209.15030855277, + "unit": "iter/sec", + "range": "stddev: 0.000002080748271491382", + "extra": "mean: 24.869960999581053 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdseq_dispatch", + "value": 22707.973014545758, + "unit": "iter/sec", + "range": "stddev: 0.000012881126800796862", + "extra": "mean: 44.03739600004997 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_instantiation_functorch", + "value": 776.3924432525881, + "unit": "iter/sec", + "range": "stddev: 0.00002146027149064373", + "extra": "mean: 1.2880084146757522 msec\nrounds: 586" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_instantiation_td", + "value": 979.4552367464794, + "unit": "iter/sec", + "range": "stddev: 0.00009764406985530428", + "extra": "mean: 1.0209757041289251 msec\nrounds: 872" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_functorch", + "value": 6550.975878764866, + "unit": "iter/sec", + "range": "stddev: 0.000012038979976543235", + "extra": "mean: 152.6490126824497 usec\nrounds: 2602" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_td", + "value": 6855.699190624831, + "unit": "iter/sec", + "range": "stddev: 0.000006984415772269433", + "extra": "mean: 145.8640427758995 usec\nrounds: 2291" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed[True-True]", + "value": 1148.0122295808505, + "unit": "iter/sec", + "range": "stddev: 0.000024649453661314255", + "extra": "mean: 871.0708599028678 usec\nrounds: 1035" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed[True-False]", + "value": 2112.224159366907, + "unit": "iter/sec", + "range": "stddev: 0.000032923599066499854", + "extra": "mean: 473.4345999999016 usec\nrounds: 2010" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed[False-True]", + "value": 1314.1896388023802, + "unit": "iter/sec", + "range": "stddev: 0.00003296955149669985", + "extra": "mean: 760.9251895421265 usec\nrounds: 1224" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed[False-False]", + "value": 2584.746432452793, + "unit": "iter/sec", + "range": "stddev: 0.000017047317019335308", + "extra": "mean: 386.8851456547135 usec\nrounds: 2451" + } + ] } ], "GPU Benchmark Results": [