diff --git a/dev/bench/data.js b/dev/bench/data.js index 5ffaddcaf..51385dc23 100644 --- a/dev/bench/data.js +++ b/dev/bench/data.js @@ -1,5 +1,5 @@ window.BENCHMARK_DATA = { - "lastUpdate": 1701379247334, + "lastUpdate": 1701690491545, "repoUrl": "https://github.com/pytorch/tensordict", "entries": { "CPU Benchmark Results": [ @@ -153521,6 +153521,821 @@ window.BENCHMARK_DATA = { "extra": "mean: 407.7899364611565 usec\nrounds: 2345" } ] + }, + { + "commit": { + "author": { + "email": "vmoens@meta.com", + "name": "Vincent Moens", + "username": "vmoens" + }, + "committer": { + "email": "noreply@github.com", + "name": "GitHub", + "username": "web-flow" + }, + "distinct": true, + "id": "86c239ff93532a56ee848f0de1248624c3d1ffa4", + "message": "[Performance] Make copy_ a no-op if tensors are identical (#588)", + "timestamp": "2023-12-04T11:44:05Z", + "tree_id": "466dcfe838eca82ca50df1739a7dbe5f27560ceb", + "url": "https://github.com/pytorch/tensordict/commit/86c239ff93532a56ee848f0de1248624c3d1ffa4" + }, + "date": 1701690486936, + "tool": "pytest", + "benches": [ + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_nested", + "value": 64272.260700637125, + "unit": "iter/sec", + "range": "stddev: 5.554404442698035e-7", + "extra": "mean: 15.55881167239053 usec\nrounds: 8533" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_stack_nested", + "value": 7200.961085867142, + "unit": "iter/sec", + "range": "stddev: 0.0000029606782248443653", + "extra": "mean: 138.87035189825355 usec\nrounds: 1975" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_nested_inplace", + "value": 56222.35119826479, + "unit": "iter/sec", + "range": "stddev: 9.200406395682728e-7", + "extra": "mean: 17.786520461827703 usec\nrounds: 36629" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_stack_nested_inplace", + "value": 5744.20505322264, + "unit": "iter/sec", + "range": "stddev: 0.000006240817286540491", + "extra": "mean: 174.08849279135242 usec\nrounds: 3884" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items", + "value": 416750.51703091257, + "unit": "iter/sec", + "range": "stddev: 1.7207204269709975e-7", + "extra": "mean: 2.3995171190773226 usec\nrounds: 98049" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_nested", + "value": 3757.544706410901, + "unit": "iter/sec", + "range": "stddev: 0.000013399861018225456", + "extra": "mean: 266.13123146448766 usec\nrounds: 3102" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_nested_locked", + "value": 3767.1661124434386, + "unit": "iter/sec", + "range": "stddev: 0.000005260627135641513", + "extra": "mean: 265.4515277934972 usec\nrounds: 3634" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_nested_leaf", + "value": 6066.344807829845, + "unit": "iter/sec", + "range": "stddev: 0.00000491714920737751", + "extra": "mean: 164.843910407021 usec\nrounds: 5391" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_stack_nested", + "value": 684.1412107479103, + "unit": "iter/sec", + "range": "stddev: 0.000037212975110378526", + "extra": "mean: 1.4616865411554283 msec\nrounds: 571" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_stack_nested_leaf", + "value": 757.6346039856194, + "unit": "iter/sec", + "range": "stddev: 0.000046915467494576824", + "extra": "mean: 1.3198974739793972 msec\nrounds: 711" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_stack_nested_locked", + "value": 1306.7428751187463, + "unit": "iter/sec", + "range": "stddev: 0.00003263618913383692", + "extra": "mean: 765.2614902599933 usec\nrounds: 1232" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys", + "value": 248439.54920364046, + "unit": "iter/sec", + "range": "stddev: 2.195247668393677e-7", + "extra": "mean: 4.025124032004751 usec\nrounds: 88961" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_nested", + "value": 6725.885499212732, + "unit": "iter/sec", + "range": "stddev: 0.0005971565811786517", + "extra": "mean: 148.6793077457311 usec\nrounds: 5771" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_nested_locked", + "value": 7157.2361451581355, + "unit": "iter/sec", + "range": "stddev: 0.0000025776248296221913", + "extra": "mean: 139.71873775277055 usec\nrounds: 6879" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_nested_leaf", + "value": 7083.477989216358, + "unit": "iter/sec", + "range": "stddev: 0.0000037798037717765747", + "extra": "mean: 141.17358754024016 usec\nrounds: 2456" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_stack_nested", + "value": 713.0527248093774, + "unit": "iter/sec", + "range": "stddev: 0.00006042701638769853", + "extra": "mean: 1.4024208381888352 msec\nrounds: 618" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_stack_nested_leaf", + "value": 719.493981687004, + "unit": "iter/sec", + "range": "stddev: 0.000021952256450884392", + "extra": "mean: 1.3898656909614324 msec\nrounds: 686" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_stack_nested_locked", + "value": 1474.7288702844887, + "unit": "iter/sec", + "range": "stddev: 0.00002798553958889217", + "extra": "mean: 678.0907461363328 usec\nrounds: 1359" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values", + "value": 872788.1272749081, + "unit": "iter/sec", + "range": "stddev: 5.928481449653489e-8", + "extra": "mean: 1.145753440897831 usec\nrounds: 195734" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_nested", + "value": 20382.398995515512, + "unit": "iter/sec", + "range": "stddev: 0.0000034612966451904022", + "extra": "mean: 49.0619382056066 usec\nrounds: 15940" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_nested_locked", + "value": 20564.60525408873, + "unit": "iter/sec", + "range": "stddev: 0.0000013150414938455366", + "extra": "mean: 48.62724023361335 usec\nrounds: 18661" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_nested_leaf", + "value": 22817.429473391065, + "unit": "iter/sec", + "range": "stddev: 9.087058700307879e-7", + "extra": "mean: 43.82614619960443 usec\nrounds: 855" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_stack_nested", + "value": 827.3492195690875, + "unit": "iter/sec", + "range": "stddev: 0.00005270977691975866", + "extra": "mean: 1.2086794504028602 msec\nrounds: 746" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_stack_nested_leaf", + "value": 849.8165613079924, + "unit": "iter/sec", + "range": "stddev: 0.00002253511430863541", + "extra": "mean: 1.1767245374235271 msec\nrounds: 815" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_stack_nested_locked", + "value": 1851.857237181767, + "unit": "iter/sec", + "range": "stddev: 0.00014772724682059576", + "extra": "mean: 539.9984296423635 usec\nrounds: 1869" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership", + "value": 746784.7049174516, + "unit": "iter/sec", + "range": "stddev: 1.0793847362815923e-7", + "extra": "mean: 1.3390740241667622 usec\nrounds: 69653" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested", + "value": 358840.73826873826, + "unit": "iter/sec", + "range": "stddev: 2.1987488114197352e-7", + "extra": "mean: 2.7867515957764337 usec\nrounds: 158705" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested_leaf", + "value": 357921.6336746965, + "unit": "iter/sec", + "range": "stddev: 2.3289568715755996e-7", + "extra": "mean: 2.793907676753811 usec\nrounds: 158454" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested", + "value": 88196.79749273106, + "unit": "iter/sec", + "range": "stddev: 7.167037889555989e-7", + "extra": "mean: 11.338280169213823 usec\nrounds: 34936" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested_leaf", + "value": 87715.91116740325, + "unit": "iter/sec", + "range": "stddev: 0.0000017730395744101062", + "extra": "mean: 11.400440201681645 usec\nrounds: 47217" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested_last", + "value": 168981.371872055, + "unit": "iter/sec", + "range": "stddev: 6.800317845660462e-7", + "extra": "mean: 5.917812057752464 usec\nrounds: 88176" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested_leaf_last", + "value": 170971.3631509529, + "unit": "iter/sec", + "range": "stddev: 4.598245337303537e-7", + "extra": "mean: 5.8489327193179514 usec\nrounds: 91408" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested_last", + "value": 5998.250116564432, + "unit": "iter/sec", + "range": "stddev: 0.000007790019017943897", + "extra": "mean: 166.7152887203646 usec\nrounds: 5133" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested_leaf_last", + "value": 74284.78197833321, + "unit": "iter/sec", + "range": "stddev: 7.067803056039466e-7", + "extra": "mean: 13.46170740989281 usec\nrounds: 39205" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_getleaf", + "value": 93880.08729017673, + "unit": "iter/sec", + "range": "stddev: 0.0000016298595842118084", + "extra": "mean: 10.651886133308233 usec\nrounds: 70240" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_get", + "value": 100169.29334591252, + "unit": "iter/sec", + "range": "stddev: 5.757912760605594e-7", + "extra": "mean: 9.983099277207845 usec\nrounds: 75959" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_getleaf", + "value": 1566.8876151033278, + "unit": "iter/sec", + "range": "stddev: 0.00002250736147804212", + "extra": "mean: 638.2078652999344 usec\nrounds: 1366" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_get", + "value": 1653.318183074342, + "unit": "iter/sec", + "range": "stddev: 0.00001360036545519102", + "extra": "mean: 604.8442521454048 usec\nrounds: 1515" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_getitemleaf", + "value": 95249.31526648473, + "unit": "iter/sec", + "range": "stddev: 6.421351514591982e-7", + "extra": "mean: 10.498763137585188 usec\nrounds: 64814" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_getitem", + "value": 100594.06599168763, + "unit": "iter/sec", + "range": "stddev: 4.4031654974878966e-7", + "extra": "mean: 9.940944231070576 usec\nrounds: 71348" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_getitemleaf", + "value": 1565.3591275829249, + "unit": "iter/sec", + "range": "stddev: 0.000029090926793796165", + "extra": "mean: 638.8310403530866 usec\nrounds: 1363" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_getitem", + "value": 1652.1038236397258, + "unit": "iter/sec", + "range": "stddev: 0.000010348789517333346", + "extra": "mean: 605.2888357808619 usec\nrounds: 1498" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_lock_nested", + "value": 1789.6414237196407, + "unit": "iter/sec", + "range": "stddev: 0.0003803424746611366", + "extra": "mean: 558.7711520007019 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_lock_stack_nested", + "value": 198.4150145930312, + "unit": "iter/sec", + "range": "stddev: 0.0011462301321293695", + "extra": "mean: 5.03994116600046 msec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unlock_nested", + "value": 2274.455171153501, + "unit": "iter/sec", + "range": "stddev: 0.00008021690751538575", + "extra": "mean: 439.66573299962874 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unlock_stack_nested", + "value": 143.2901767637305, + "unit": "iter/sec", + "range": "stddev: 0.01167797689761069", + "extra": "mean: 6.9788454629998 msec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_flatten_speed", + "value": 3731.350245056531, + "unit": "iter/sec", + "range": "stddev: 0.000006594195964940675", + "extra": "mean: 267.9994999999925 usec\nrounds: 3348" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unflatten_speed", + "value": 2179.913449066858, + "unit": "iter/sec", + "range": "stddev: 0.0000354226450001459", + "extra": "mean: 458.73380910056943 usec\nrounds: 2022" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_common_ops", + "value": 1472.0784316875265, + "unit": "iter/sec", + "range": "stddev: 0.0001234952802670521", + "extra": "mean: 679.3116307353566 usec\nrounds: 937" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation", + "value": 386873.8989093904, + "unit": "iter/sec", + "range": "stddev: 2.1597735165578662e-7", + "extra": "mean: 2.584821573176767 usec\nrounds: 91567" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation_empty", + "value": 113283.22472815018, + "unit": "iter/sec", + "range": "stddev: 4.857516853102323e-7", + "extra": "mean: 8.82743232636373 usec\nrounds: 23015" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation_nested_1", + "value": 82193.0899860279, + "unit": "iter/sec", + "range": "stddev: 6.325125943848155e-7", + "extra": "mean: 12.166472877099414 usec\nrounds: 24057" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation_nested_2", + "value": 64393.20709062516, + "unit": "iter/sec", + "range": "stddev: 8.088034882838915e-7", + "extra": "mean: 15.529588370907334 usec\nrounds: 22083" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_clone", + "value": 73885.93987958277, + "unit": "iter/sec", + "range": "stddev: 0.0000018166062039460133", + "extra": "mean: 13.534374762367129 usec\nrounds: 13670" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[int]", + "value": 76786.78776784017, + "unit": "iter/sec", + "range": "stddev: 7.634205301196367e-7", + "extra": "mean: 13.023073748356746 usec\nrounds: 15702" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[slice_int]", + "value": 39208.195636217504, + "unit": "iter/sec", + "range": "stddev: 0.000002072116484619773", + "extra": "mean: 25.504871718102663 usec\nrounds: 11997" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[range]", + "value": 21995.04285472427, + "unit": "iter/sec", + "range": "stddev: 0.0000027679556659612414", + "extra": "mean: 45.46478979854372 usec\nrounds: 5666" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[tuple]", + "value": 49034.855877657625, + "unit": "iter/sec", + "range": "stddev: 0.0000013095772624557309", + "extra": "mean: 20.39365635120879 usec\nrounds: 15478" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[list]", + "value": 24624.623719541814, + "unit": "iter/sec", + "range": "stddev: 0.000002662132306067149", + "extra": "mean: 40.60975759018042 usec\nrounds: 8399" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[int]", + "value": 34288.47303874784, + "unit": "iter/sec", + "range": "stddev: 0.000004165139435371316", + "extra": "mean: 29.16431999960878 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[slice_int]", + "value": 19220.707190368772, + "unit": "iter/sec", + "range": "stddev: 0.000003413990397152479", + "extra": "mean: 52.027222000504025 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[range]", + "value": 13618.937153795, + "unit": "iter/sec", + "range": "stddev: 0.000003209973553952264", + "extra": "mean: 73.42716900058122 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[tuple]", + "value": 23612.288117907723, + "unit": "iter/sec", + "range": "stddev: 0.0000054644810568729274", + "extra": "mean: 42.350830000316364 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem", + "value": 53137.37947713408, + "unit": "iter/sec", + "range": "stddev: 0.0000018736469424015588", + "extra": "mean: 18.819144072212232 usec\nrounds: 19872" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set", + "value": 55143.50217981865, + "unit": "iter/sec", + "range": "stddev: 0.0000019281659458766906", + "extra": "mean: 18.134502896444232 usec\nrounds: 20543" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set_shared", + "value": 7140.14685126069, + "unit": "iter/sec", + "range": "stddev: 0.00007642969816501206", + "extra": "mean: 140.05314187948898 usec\nrounds: 3799" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_update", + "value": 50634.505883970254, + "unit": "iter/sec", + "range": "stddev: 0.000003014446469630161", + "extra": "mean: 19.749378068219237 usec\nrounds: 25953" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_update_nested", + "value": 36693.10458118684, + "unit": "iter/sec", + "range": "stddev: 0.0000024644612131337585", + "extra": "mean: 27.253076876812337 usec\nrounds: 19967" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set_nested", + "value": 48968.19125179494, + "unit": "iter/sec", + "range": "stddev: 0.0000019040582494973747", + "extra": "mean: 20.421419996053963 usec\nrounds: 15543" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set_nested_new", + "value": 38787.908482237675, + "unit": "iter/sec", + "range": "stddev: 0.000001957081601690533", + "extra": "mean: 25.78123026298091 usec\nrounds: 15960" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_select", + "value": 19510.371022504754, + "unit": "iter/sec", + "range": "stddev: 0.000003916879276922219", + "extra": "mean: 51.25479155914173 usec\nrounds: 9691" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unbind_speed", + "value": 2726.99390918679, + "unit": "iter/sec", + "range": "stddev: 0.000018471867369851212", + "extra": "mean: 366.70415604199405 usec\nrounds: 2243" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unbind_speed_stack0", + "value": 219.25194401264332, + "unit": "iter/sec", + "range": "stddev: 0.0059203175239201525", + "extra": "mean: 4.560962980297836 msec\nrounds: 203" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unbind_speed_stack1", + "value": 1570545.8198155684, + "unit": "iter/sec", + "range": "stddev: 3.7196268769634144e-8", + "extra": "mean: 636.7213152160286 nsec\nrounds: 74991" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_split", + "value": 611.4151613763734, + "unit": "iter/sec", + "range": "stddev: 0.000015059462124359509", + "extra": "mean: 1.63554989010883 msec\nrounds: 455" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_chunk", + "value": 578.0757120338105, + "unit": "iter/sec", + "range": "stddev: 0.002407640754087599", + "extra": "mean: 1.729877210169854 msec\nrounds: 590" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_creation[device0]", + "value": 3317.504431287118, + "unit": "iter/sec", + "range": "stddev: 0.00009746854063062854", + "extra": "mean: 301.43139842379117 usec\nrounds: 1649" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_creation_from_tensor", + "value": 2773.695970422222, + "unit": "iter/sec", + "range": "stddev: 0.0013419732946362093", + "extra": "mean: 360.52978071990213 usec\nrounds: 2002" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_add_one[memmap_tensor0]", + "value": 39009.57921210363, + "unit": "iter/sec", + "range": "stddev: 0.00000406393962003831", + "extra": "mean: 25.634729217733444 usec\nrounds: 6869" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_contiguous[memmap_tensor0]", + "value": 173519.0325124351, + "unit": "iter/sec", + "range": "stddev: 5.693574449532092e-7", + "extra": "mean: 5.763056568035761 usec\nrounds: 33800" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_stack[memmap_tensor0]", + "value": 52290.66167495306, + "unit": "iter/sec", + "range": "stddev: 0.0000016873961650282065", + "extra": "mean: 19.12387351715219 usec\nrounds: 11045" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_memmaptd_index", + "value": 4917.892246589996, + "unit": "iter/sec", + "range": "stddev: 0.000014778602235084652", + "extra": "mean: 203.3391440598129 usec\nrounds: 2138" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_memmaptd_index_astensor", + "value": 3825.8606690071097, + "unit": "iter/sec", + "range": "stddev: 0.000020920843124278838", + "extra": "mean: 261.379095193114 usec\nrounds: 3162" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_memmaptd_index_op", + "value": 1955.6303281252283, + "unit": "iter/sec", + "range": "stddev: 0.000010429065199414941", + "extra": "mean: 511.34408462495736 usec\nrounds: 1678" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_reshape_pytree", + "value": 41807.65602599779, + "unit": "iter/sec", + "range": "stddev: 0.000002695665532186528", + "extra": "mean: 23.919063995794385 usec\nrounds: 12032" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_reshape_td", + "value": 31353.68324028356, + "unit": "iter/sec", + "range": "stddev: 0.0000016602309237738362", + "extra": "mean: 31.894179460076604 usec\nrounds: 1889" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_view_pytree", + "value": 42865.05222902789, + "unit": "iter/sec", + "range": "stddev: 0.000001223281869007797", + "extra": "mean: 23.329027914325216 usec\nrounds: 13219" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_view_td", + "value": 206273.55539824502, + "unit": "iter/sec", + "range": "stddev: 4.986223016299189e-7", + "extra": "mean: 4.8479311760023505 usec\nrounds: 31428" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_unbind_pytree", + "value": 38161.81067755061, + "unit": "iter/sec", + "range": "stddev: 0.000001481416665456087", + "extra": "mean: 26.20420735403597 usec\nrounds: 11150" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_unbind_td", + "value": 17052.63953607153, + "unit": "iter/sec", + "range": "stddev: 0.0000019678789168049236", + "extra": "mean: 58.64194794504953 usec\nrounds: 9490" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_split_pytree", + "value": 37859.83191366538, + "unit": "iter/sec", + "range": "stddev: 0.0000023559058527436304", + "extra": "mean: 26.413218164316607 usec\nrounds: 9447" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_split_td", + "value": 21946.89148299909, + "unit": "iter/sec", + "range": "stddev: 0.000002407204403238616", + "extra": "mean: 45.56453932324032 usec\nrounds: 9638" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_add_pytree", + "value": 31415.620660961496, + "unit": "iter/sec", + "range": "stddev: 0.000002034296055218516", + "extra": "mean: 31.831298537502594 usec\nrounds: 9235" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_add_td", + "value": 21462.961814414888, + "unit": "iter/sec", + "range": "stddev: 0.0000027625898538467767", + "extra": "mean: 46.591892053238574 usec\nrounds: 9727" + }, + { + "name": "benchmarks/distributed/distributed_benchmark_test.py::test_distributed", + "value": 170753.75169886218, + "unit": "iter/sec", + "range": "stddev: 4.315965285564031e-7", + "extra": "mean: 5.856386697515024 usec\nrounds: 16884" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdmodule", + "value": 44936.42641556756, + "unit": "iter/sec", + "range": "stddev: 0.000048245155782332045", + "extra": "mean: 22.25366099992243 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdmodule_dispatch", + "value": 25835.916559179957, + "unit": "iter/sec", + "range": "stddev: 0.000013163196632248638", + "extra": "mean: 38.70580699970105 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdseq", + "value": 37073.199884087524, + "unit": "iter/sec", + "range": "stddev: 0.000007135684297375582", + "extra": "mean: 26.9736629998647 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdseq_dispatch", + "value": 22006.566187403747, + "unit": "iter/sec", + "range": "stddev: 0.000006735113406830076", + "extra": "mean: 45.44098299953703 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_instantiation_functorch", + "value": 760.8861447160008, + "unit": "iter/sec", + "range": "stddev: 0.000032599593886335716", + "extra": "mean: 1.3142570763635708 msec\nrounds: 550" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_instantiation_td", + "value": 968.9044945051002, + "unit": "iter/sec", + "range": "stddev: 0.0001122116440773693", + "extra": "mean: 1.0320934681088283 msec\nrounds: 878" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_functorch", + "value": 6192.499033267969, + "unit": "iter/sec", + "range": "stddev: 0.00001263367315112812", + "extra": "mean: 161.48569335702743 usec\nrounds: 2710" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_functional_call", + "value": 6768.6859568993805, + "unit": "iter/sec", + "range": "stddev: 0.000007549181180612372", + "extra": "mean: 147.73916331288666 usec\nrounds: 3429" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_td", + "value": 7019.075793096863, + "unit": "iter/sec", + "range": "stddev: 0.000007711083112789435", + "extra": "mean: 142.46889896579864 usec\nrounds: 2128" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_td_decorator", + "value": 5723.136459298392, + "unit": "iter/sec", + "range": "stddev: 0.00004949623335676117", + "extra": "mean: 174.72936511504943 usec\nrounds: 3566" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed[True-True]", + "value": 1100.0186286161208, + "unit": "iter/sec", + "range": "stddev: 0.00003903695875848079", + "extra": "mean: 909.0755138011169 usec\nrounds: 942" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed[True-False]", + "value": 2130.526496687744, + "unit": "iter/sec", + "range": "stddev: 0.000019581794557042734", + "extra": "mean: 469.3675490798474 usec\nrounds: 1956" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed[False-True]", + "value": 1263.3447484235937, + "unit": "iter/sec", + "range": "stddev: 0.00003077621812918979", + "extra": "mean: 791.5495760344147 usec\nrounds: 1210" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed[False-False]", + "value": 2591.6232024388246, + "unit": "iter/sec", + "range": "stddev: 0.00001628013312071578", + "extra": "mean: 385.8585611746949 usec\nrounds: 2452" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[True-True]", + "value": 552.8019779212365, + "unit": "iter/sec", + "range": "stddev: 0.00010173432213529649", + "extra": "mean: 1.8089660311282039 msec\nrounds: 514" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[True-False]", + "value": 1924.283819664087, + "unit": "iter/sec", + "range": "stddev: 0.00005065684868489742", + "extra": "mean: 519.6738598439003 usec\nrounds: 1798" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[False-True]", + "value": 660.2226444500709, + "unit": "iter/sec", + "range": "stddev: 0.00009524487282850242", + "extra": "mean: 1.5146405661880091 msec\nrounds: 627" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[False-False]", + "value": 2530.7117514505803, + "unit": "iter/sec", + "range": "stddev: 0.00004238784489723879", + "extra": "mean: 395.14575274201394 usec\nrounds: 2370" + } + ] } ], "GPU Benchmark Results": [