From 80b7744ede804f04768f2e25f712b104418610e5 Mon Sep 17 00:00:00 2001 From: github-action-benchmark Date: Wed, 17 Jan 2024 15:42:18 +0000 Subject: [PATCH] add GPU Benchmark Results (pytest) benchmark result for 617a449ac6a684dccee0a5697c7d343e80342872 --- dev/bench/data.js | 950 +++++++++++++++++++++++++++++++++++++++++++++- 1 file changed, 949 insertions(+), 1 deletion(-) diff --git a/dev/bench/data.js b/dev/bench/data.js index 7a39842d0..1b1517c02 100644 --- a/dev/bench/data.js +++ b/dev/bench/data.js @@ -1,5 +1,5 @@ window.BENCHMARK_DATA = { - "lastUpdate": 1705506005938, + "lastUpdate": 1705506137512, "repoUrl": "https://github.com/pytorch/tensordict", "entries": { "CPU Benchmark Results": [ @@ -266944,6 +266944,954 @@ window.BENCHMARK_DATA = { "extra": "mean: 19.243306622615393 msec\nrounds: 53" } ] + }, + { + "commit": { + "author": { + "email": "vmoens@meta.com", + "name": "Vincent Moens", + "username": "vmoens" + }, + "committer": { + "email": "noreply@github.com", + "name": "GitHub", + "username": "web-flow" + }, + "distinct": true, + "id": "617a449ac6a684dccee0a5697c7d343e80342872", + "message": "[Feature] Improve the `empty` method (#622)", + "timestamp": "2024-01-17T15:29:22Z", + "tree_id": "4bb22a4b95527f625d75cb77a8622b32d4b866d6", + "url": "https://github.com/pytorch/tensordict/commit/617a449ac6a684dccee0a5697c7d343e80342872" + }, + "date": 1705506136028, + "tool": "pytest", + "benches": [ + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_nested", + "value": 76252.55544635771, + "unit": "iter/sec", + "range": "stddev: 7.309318969540794e-7", + "extra": "mean: 13.114314584558176 usec\nrounds: 22846" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_stack_nested", + "value": 8583.557196478441, + "unit": "iter/sec", + "range": "stddev: 0.0000023500497226158862", + "extra": "mean: 116.50181586839872 usec\nrounds: 2987" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_nested_inplace", + "value": 69132.32171618173, + "unit": "iter/sec", + "range": "stddev: 6.883418001866647e-7", + "extra": "mean: 14.465013978634122 usec\nrounds: 47215" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_stack_nested_inplace", + "value": 6934.344772195376, + "unit": "iter/sec", + "range": "stddev: 0.0000027665885823826287", + "extra": "mean: 144.20973182782856 usec\nrounds: 5269" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items", + "value": 208476.16153273004, + "unit": "iter/sec", + "range": "stddev: 3.5068849036770574e-7", + "extra": "mean: 4.796711492805394 usec\nrounds: 107980" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_nested", + "value": 2944.3119640164223, + "unit": "iter/sec", + "range": "stddev: 0.0000036147370294605253", + "extra": "mean: 339.6379229583643 usec\nrounds: 2596" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_nested_locked", + "value": 2901.9444248791956, + "unit": "iter/sec", + "range": "stddev: 0.00000486730040287498", + "extra": "mean: 344.5965372137093 usec\nrounds: 2096" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_nested_leaf", + "value": 4951.208481070527, + "unit": "iter/sec", + "range": "stddev: 0.000003195564236991728", + "extra": "mean: 201.97089333305243 usec\nrounds: 4725" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_stack_nested", + "value": 766.6873526864489, + "unit": "iter/sec", + "range": "stddev: 0.00001133009397613122", + "extra": "mean: 1.3043126334300816 msec\nrounds: 682" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_stack_nested_leaf", + "value": 883.5870749745258, + "unit": "iter/sec", + "range": "stddev: 0.000014349760879517404", + "extra": "mean: 1.1317503710982084 msec\nrounds: 865" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_stack_nested_locked", + "value": 1106.2380913463378, + "unit": "iter/sec", + "range": "stddev: 0.000008741190862499365", + "extra": "mean: 903.9645333338308 usec\nrounds: 1065" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys", + "value": 217618.7126998515, + "unit": "iter/sec", + "range": "stddev: 3.2017122413073523e-7", + "extra": "mean: 4.595193067699285 usec\nrounds: 121952" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_nested", + "value": 10584.81136841202, + "unit": "iter/sec", + "range": "stddev: 0.000008398958255982002", + "extra": "mean: 94.47499489544747 usec\nrounds: 8424" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_nested_locked", + "value": 10283.021995544303, + "unit": "iter/sec", + "range": "stddev: 0.000002059686713231721", + "extra": "mean: 97.24767684376309 usec\nrounds: 9531" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_nested_leaf", + "value": 12855.855831034965, + "unit": "iter/sec", + "range": "stddev: 0.000002225373835165156", + "extra": "mean: 77.78556427071372 usec\nrounds: 10378" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_stack_nested", + "value": 882.4982054749734, + "unit": "iter/sec", + "range": "stddev: 0.000024344427131841926", + "extra": "mean: 1.1331467801249357 msec\nrounds: 805" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_stack_nested_leaf", + "value": 903.4909564054822, + "unit": "iter/sec", + "range": "stddev: 0.000015090076732456863", + "extra": "mean: 1.1068179409105288 msec\nrounds: 880" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_stack_nested_locked", + "value": 1396.167050367997, + "unit": "iter/sec", + "range": "stddev: 0.000010520720096753975", + "extra": "mean: 716.2466695775576 usec\nrounds: 1374" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values", + "value": 534028.7249834236, + "unit": "iter/sec", + "range": "stddev: 1.1489848567049214e-7", + "extra": "mean: 1.8725584471715766 usec\nrounds: 168919" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_nested", + "value": 22050.363083274497, + "unit": "iter/sec", + "range": "stddev: 0.0000013459106222731022", + "extra": "mean: 45.35072716142773 usec\nrounds: 17153" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_nested_locked", + "value": 20910.044314639996, + "unit": "iter/sec", + "range": "stddev: 0.0000013588791455034172", + "extra": "mean: 47.82390629846051 usec\nrounds: 19466" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_nested_leaf", + "value": 25275.696352392657, + "unit": "iter/sec", + "range": "stddev: 0.0000012951332420067553", + "extra": "mean: 39.56369731848506 usec\nrounds: 21706" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_stack_nested", + "value": 1054.1400376619279, + "unit": "iter/sec", + "range": "stddev: 0.000011899148256120717", + "extra": "mean: 948.6405641303502 usec\nrounds: 920" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_stack_nested_leaf", + "value": 1082.7830508584998, + "unit": "iter/sec", + "range": "stddev: 0.000012191633301009996", + "extra": "mean: 923.5460411087298 usec\nrounds: 1046" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_stack_nested_locked", + "value": 1752.9487103711679, + "unit": "iter/sec", + "range": "stddev: 0.000009571346359309306", + "extra": "mean: 570.4673468673598 usec\nrounds: 1724" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership", + "value": 1058023.8690258786, + "unit": "iter/sec", + "range": "stddev: 6.354098381310068e-8", + "extra": "mean: 945.158260862966 nsec\nrounds: 172385" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested", + "value": 341320.57656888483, + "unit": "iter/sec", + "range": "stddev: 2.8561900729098884e-7", + "extra": "mean: 2.9297969962797756 usec\nrounds: 163667" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested_leaf", + "value": 344015.1512192213, + "unit": "iter/sec", + "range": "stddev: 2.958746655072728e-7", + "extra": "mean: 2.906848714238045 usec\nrounds: 172118" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested", + "value": 89373.50424947546, + "unit": "iter/sec", + "range": "stddev: 6.770138209488883e-7", + "extra": "mean: 11.18899844419907 usec\nrounds: 26997" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested_leaf", + "value": 89034.84497383444, + "unit": "iter/sec", + "range": "stddev: 6.504718231968909e-7", + "extra": "mean: 11.231557715340328 usec\nrounds: 52629" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested_last", + "value": 187309.92672716777, + "unit": "iter/sec", + "range": "stddev: 4.137883712878209e-7", + "extra": "mean: 5.338745348272875 usec\nrounds: 101523" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested_leaf_last", + "value": 186443.6966647163, + "unit": "iter/sec", + "range": "stddev: 4.0950225940915497e-7", + "extra": "mean: 5.36354952132445 usec\nrounds: 111235" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested_last", + "value": 7038.945320017973, + "unit": "iter/sec", + "range": "stddev: 0.000003090600728958881", + "extra": "mean: 142.06673791826623 usec\nrounds: 6063" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested_leaf_last", + "value": 76424.13077060123, + "unit": "iter/sec", + "range": "stddev: 7.318124393199697e-7", + "extra": "mean: 13.084872407664715 usec\nrounds: 46147" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_getleaf", + "value": 118803.99726470956, + "unit": "iter/sec", + "range": "stddev: 4.7261243150588976e-7", + "extra": "mean: 8.417225203053396 usec\nrounds: 94608" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_get", + "value": 126040.06945224067, + "unit": "iter/sec", + "range": "stddev: 4.5291737082598995e-7", + "extra": "mean: 7.933984837884605 usec\nrounds: 93721" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_getleaf", + "value": 3127.877455613771, + "unit": "iter/sec", + "range": "stddev: 0.000005747292508988331", + "extra": "mean: 319.705619606435 usec\nrounds: 2642" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_get", + "value": 3493.427309610404, + "unit": "iter/sec", + "range": "stddev: 0.000004941009445321732", + "extra": "mean: 286.25184135047095 usec\nrounds: 3139" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_getitemleaf", + "value": 118529.4978363636, + "unit": "iter/sec", + "range": "stddev: 4.597991037319982e-7", + "extra": "mean: 8.436718439325155 usec\nrounds: 78555" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_getitem", + "value": 125542.89981783004, + "unit": "iter/sec", + "range": "stddev: 4.4030307432017816e-7", + "extra": "mean: 7.965404666062816 usec\nrounds: 92328" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_getitemleaf", + "value": 3094.4173128850666, + "unit": "iter/sec", + "range": "stddev: 0.000006165282026760021", + "extra": "mean: 323.16261799467975 usec\nrounds: 2623" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_getitem", + "value": 3466.5842993028227, + "unit": "iter/sec", + "range": "stddev: 0.000004595082427815806", + "extra": "mean: 288.4683924176064 usec\nrounds: 3086" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_lock_nested", + "value": 2492.068748229294, + "unit": "iter/sec", + "range": "stddev: 0.0000807805880351111", + "extra": "mean: 401.27303900044353 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_lock_stack_nested", + "value": 155.9258347212235, + "unit": "iter/sec", + "range": "stddev: 0.013782630059369916", + "extra": "mean: 6.41330541399941 msec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unlock_nested", + "value": 2497.025811287362, + "unit": "iter/sec", + "range": "stddev: 0.00007284692060957593", + "extra": "mean: 400.47643699944047 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unlock_stack_nested", + "value": 145.10729251708227, + "unit": "iter/sec", + "range": "stddev: 0.014659135505266855", + "extra": "mean: 6.891452405000791 msec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_flatten_speed", + "value": 3819.714199534573, + "unit": "iter/sec", + "range": "stddev: 0.000006672961851751692", + "extra": "mean: 261.79969174705496 usec\nrounds: 3296" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unflatten_speed", + "value": 2774.6395925188162, + "unit": "iter/sec", + "range": "stddev: 0.000005678244436412449", + "extra": "mean: 360.4071688071749 usec\nrounds: 2725" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_common_ops", + "value": 1747.464517929739, + "unit": "iter/sec", + "range": "stddev: 0.000060843904963404574", + "extra": "mean: 572.2576852002252 usec\nrounds: 1223" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation", + "value": 647045.2055889365, + "unit": "iter/sec", + "range": "stddev: 2.0518537381655614e-7", + "extra": "mean: 1.5454870716332816 usec\nrounds: 149477" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation_empty", + "value": 139945.46819649995, + "unit": "iter/sec", + "range": "stddev: 5.318327258096988e-7", + "extra": "mean: 7.145640461868204 usec\nrounds: 36469" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation_nested_1", + "value": 112624.53537152632, + "unit": "iter/sec", + "range": "stddev: 5.91208850300943e-7", + "extra": "mean: 8.879059937527783 usec\nrounds: 41927" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation_nested_2", + "value": 88516.88142545137, + "unit": "iter/sec", + "range": "stddev: 7.206054769399675e-7", + "extra": "mean: 11.297280065635805 usec\nrounds: 38416" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_clone", + "value": 73544.9297278511, + "unit": "iter/sec", + "range": "stddev: 0.0000014909156736231994", + "extra": "mean: 13.597130403148718 usec\nrounds: 16472" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[int]", + "value": 93443.6366965145, + "unit": "iter/sec", + "range": "stddev: 6.986688119302434e-7", + "extra": "mean: 10.701638285416825 usec\nrounds: 20812" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[slice_int]", + "value": 46109.97711207683, + "unit": "iter/sec", + "range": "stddev: 0.00001658615909414075", + "extra": "mean: 21.687280337818393 usec\nrounds: 14693" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[range]", + "value": 27101.247850827323, + "unit": "iter/sec", + "range": "stddev: 0.000002406390395843203", + "extra": "mean: 36.89866996177716 usec\nrounds: 6272" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[tuple]", + "value": 53738.19972113495, + "unit": "iter/sec", + "range": "stddev: 0.0000011091004149283366", + "extra": "mean: 18.608736526145762 usec\nrounds: 24492" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[list]", + "value": 29735.79869111735, + "unit": "iter/sec", + "range": "stddev: 0.0000036917561712700607", + "extra": "mean: 33.629498584772136 usec\nrounds: 15193" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[int]", + "value": 36851.73559263666, + "unit": "iter/sec", + "range": "stddev: 0.0000017817528023541154", + "extra": "mean: 27.13576399912654 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[slice_int]", + "value": 20489.32020793459, + "unit": "iter/sec", + "range": "stddev: 0.00000244118151053785", + "extra": "mean: 48.805914000638495 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[range]", + "value": 15925.206059523318, + "unit": "iter/sec", + "range": "stddev: 0.0000027483864110894066", + "extra": "mean: 62.79353599961723 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[tuple]", + "value": 24710.754441798257, + "unit": "iter/sec", + "range": "stddev: 0.0000023136121689869186", + "extra": "mean: 40.468209999630744 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem", + "value": 55196.96587593409, + "unit": "iter/sec", + "range": "stddev: 0.000001991309183357779", + "extra": "mean: 18.116937844875288 usec\nrounds: 25195" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set", + "value": 56670.516720257416, + "unit": "iter/sec", + "range": "stddev: 0.0000017488639964467573", + "extra": "mean: 17.645859926358153 usec\nrounds: 26329" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set_shared", + "value": 9821.536496642768, + "unit": "iter/sec", + "range": "stddev: 0.00007181246298153688", + "extra": "mean: 101.81706297602452 usec\nrounds: 5256" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_update", + "value": 52041.22297707689, + "unit": "iter/sec", + "range": "stddev: 0.0000019271385639898283", + "extra": "mean: 19.215536122978506 usec\nrounds: 30922" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_update_nested", + "value": 38739.6973820428, + "unit": "iter/sec", + "range": "stddev: 0.0000020224217929729497", + "extra": "mean: 25.813314702440984 usec\nrounds: 26336" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set_nested", + "value": 54256.078807497455, + "unit": "iter/sec", + "range": "stddev: 0.0000018478691963227454", + "extra": "mean: 18.431114484849456 usec\nrounds: 24143" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set_nested_new", + "value": 45230.078259254355, + "unit": "iter/sec", + "range": "stddev: 0.000002012487068147836", + "extra": "mean: 22.109181290116243 usec\nrounds: 22202" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_select", + "value": 29035.859556992506, + "unit": "iter/sec", + "range": "stddev: 0.0000024135561033610243", + "extra": "mean: 34.44017209262114 usec\nrounds: 14161" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_select_nested", + "value": 17929.557379961003, + "unit": "iter/sec", + "range": "stddev: 0.0000016176090398108122", + "extra": "mean: 55.7738252433187 usec\nrounds: 14483" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_exclude_nested", + "value": 9077.480163373666, + "unit": "iter/sec", + "range": "stddev: 0.0000032205606724986138", + "extra": "mean: 110.16273040560937 usec\nrounds: 6239" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_empty[True]", + "value": 3126.2681644851496, + "unit": "iter/sec", + "range": "stddev: 0.000004847489015015754", + "extra": "mean: 319.8701926341899 usec\nrounds: 706" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_empty[False]", + "value": 1161164.2415253264, + "unit": "iter/sec", + "range": "stddev: 4.4416702100666184e-8", + "extra": "mean: 861.2046119215538 nsec\nrounds: 111732" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_to", + "value": 19405.79457143177, + "unit": "iter/sec", + "range": "stddev: 0.00001086482170457514", + "extra": "mean: 51.53099999688493 usec\nrounds: 5" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_to_nonblocking", + "value": 31192.473969069557, + "unit": "iter/sec", + "range": "stddev: 0.0000019049809803046943", + "extra": "mean: 32.059015292970976 usec\nrounds: 12424" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unbind_speed", + "value": 3155.5046243906586, + "unit": "iter/sec", + "range": "stddev: 0.000004915427111324335", + "extra": "mean: 316.9065233720278 usec\nrounds: 2503" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unbind_speed_stack0", + "value": 251.09201815438482, + "unit": "iter/sec", + "range": "stddev: 0.006450207484660705", + "extra": "mean: 3.9826036978409505 msec\nrounds: 278" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unbind_speed_stack1", + "value": 1878589.3224166087, + "unit": "iter/sec", + "range": "stddev: 2.0915261817215048e-8", + "extra": "mean: 532.3143212129121 nsec\nrounds: 87559" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_split", + "value": 644.5365536761487, + "unit": "iter/sec", + "range": "stddev: 0.000017383049408798775", + "extra": "mean: 1.5515023846148779 msec\nrounds: 520" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_chunk", + "value": 599.448115315658, + "unit": "iter/sec", + "range": "stddev: 0.003054692252973103", + "extra": "mean: 1.668201091054259 msec\nrounds: 626" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_creation[device0]", + "value": 14168.360859421193, + "unit": "iter/sec", + "range": "stddev: 0.000004659564395545662", + "extra": "mean: 70.5797946510555 usec\nrounds: 3029" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_creation_from_tensor", + "value": 19107.76769894165, + "unit": "iter/sec", + "range": "stddev: 0.000004548206465456448", + "extra": "mean: 52.334737147520826 usec\nrounds: 9142" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_add_one[memmap_tensor0]", + "value": 152883.21773756325, + "unit": "iter/sec", + "range": "stddev: 0.0000016957567849426654", + "extra": "mean: 6.540940299389715 usec\nrounds: 16499" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_contiguous[memmap_tensor0]", + "value": 1643123.0118050128, + "unit": "iter/sec", + "range": "stddev: 1.2015303507723863e-7", + "extra": "mean: 608.597160903659 nsec\nrounds: 95594" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_stack[memmap_tensor0]", + "value": 223863.61805667376, + "unit": "iter/sec", + "range": "stddev: 6.950734708492935e-7", + "extra": "mean: 4.467005441441753 usec\nrounds: 30507" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_memmaptd_index", + "value": 3914.581170250093, + "unit": "iter/sec", + "range": "stddev: 0.00006207778052475779", + "extra": "mean: 255.4551704278781 usec\nrounds: 2083" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_memmaptd_index_astensor", + "value": 3209.505408290229, + "unit": "iter/sec", + "range": "stddev: 0.0000569928965993791", + "extra": "mean: 311.57448665360596 usec\nrounds: 3072" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_memmaptd_index_op", + "value": 1740.8627587846427, + "unit": "iter/sec", + "range": "stddev: 0.00006537620362146479", + "extra": "mean: 574.4278203171715 usec\nrounds: 1703" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_serialize_model", + "value": 9.826909419384986, + "unit": "iter/sec", + "range": "stddev: 0.028252712989114054", + "extra": "mean: 101.76139387500172 msec\nrounds: 8" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_serialize_model_pickle", + "value": 0.8089386118142718, + "unit": "iter/sec", + "range": "stddev: 0.2626550222230022", + "extra": "mean: 1.2361877470000096 sec\nrounds: 8" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_serialize_weights", + "value": 9.882084436224599, + "unit": "iter/sec", + "range": "stddev: 0.028674716112563545", + "extra": "mean: 101.19322562498212 msec\nrounds: 8" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_serialize_weights_returnearly", + "value": 13.086035270835202, + "unit": "iter/sec", + "range": "stddev: 0.05864033147932727", + "extra": "mean: 76.41733949997034 msec\nrounds: 18" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_serialize_weights_pickle", + "value": 0.8047117831155723, + "unit": "iter/sec", + "range": "stddev: 0.24879713018681793", + "extra": "mean: 1.242680946125006 sec\nrounds: 8" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_reshape_pytree", + "value": 41042.58316255604, + "unit": "iter/sec", + "range": "stddev: 0.0000023042717295441864", + "extra": "mean: 24.364938143374946 usec\nrounds: 11187" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_reshape_td", + "value": 35182.58930573591, + "unit": "iter/sec", + "range": "stddev: 0.000001437222527777013", + "extra": "mean: 28.42314962409453 usec\nrounds: 9965" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_view_pytree", + "value": 41536.18785306281, + "unit": "iter/sec", + "range": "stddev: 0.0000013609333540217584", + "extra": "mean: 24.075391885687015 usec\nrounds: 22282" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_view_td", + "value": 236348.83251731572, + "unit": "iter/sec", + "range": "stddev: 0.000001169511543785945", + "extra": "mean: 4.231034227455879 usec\nrounds: 36024" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_unbind_pytree", + "value": 33121.71551708888, + "unit": "iter/sec", + "range": "stddev: 0.0000014737221529950982", + "extra": "mean: 30.191672876486674 usec\nrounds: 15138" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_unbind_td", + "value": 20138.210790264904, + "unit": "iter/sec", + "range": "stddev: 0.000002516721263551362", + "extra": "mean: 49.65684441457004 usec\nrounds: 12257" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_split_pytree", + "value": 35980.505407575205, + "unit": "iter/sec", + "range": "stddev: 0.0000014156950985591026", + "extra": "mean: 27.792828051533252 usec\nrounds: 12085" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_split_td", + "value": 25256.920636535055, + "unit": "iter/sec", + "range": "stddev: 0.000006156155168189263", + "extra": "mean: 39.59310853412049 usec\nrounds: 13885" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_add_pytree", + "value": 28208.232070546434, + "unit": "iter/sec", + "range": "stddev: 0.0000017881867387187355", + "extra": "mean: 35.45064424807211 usec\nrounds: 10631" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_add_td", + "value": 21371.971888977492, + "unit": "iter/sec", + "range": "stddev: 0.000002323222595875216", + "extra": "mean: 46.79025431975914 usec\nrounds: 11576" + }, + { + "name": "benchmarks/distributed/distributed_benchmark_test.py::test_distributed", + "value": 13988.771483458637, + "unit": "iter/sec", + "range": "stddev: 0.000010959532566014032", + "extra": "mean: 71.48590576252349 usec\nrounds: 4616" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdmodule", + "value": 56244.03883832058, + "unit": "iter/sec", + "range": "stddev: 0.0000022770687486159877", + "extra": "mean: 17.77966199892944 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdmodule_dispatch", + "value": 29225.00147350328, + "unit": "iter/sec", + "range": "stddev: 0.00001635705859845901", + "extra": "mean: 34.217278001051454 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdseq", + "value": 48358.8785951357, + "unit": "iter/sec", + "range": "stddev: 0.0000023440124228307075", + "extra": "mean: 20.67872599718612 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdseq_dispatch", + "value": 29019.43812210339, + "unit": "iter/sec", + "range": "stddev: 0.000002030678392367655", + "extra": "mean: 34.45966099661746 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_instantiation_functorch", + "value": 605.8118911080263, + "unit": "iter/sec", + "range": "stddev: 0.000022913325007916686", + "extra": "mean: 1.6506774044514148 msec\nrounds: 539" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_instantiation_td", + "value": 861.8115620652973, + "unit": "iter/sec", + "range": "stddev: 0.00011002448789906101", + "extra": "mean: 1.1603464655353888 msec\nrounds: 885" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_functorch", + "value": 6327.858521484343, + "unit": "iter/sec", + "range": "stddev: 0.000003913424071109501", + "extra": "mean: 158.03134608727427 usec\nrounds: 2901" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_functional_call", + "value": 6418.558049758357, + "unit": "iter/sec", + "range": "stddev: 0.000004186947522988374", + "extra": "mean: 155.79823260111323 usec\nrounds: 4368" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_td", + "value": 6915.94926028983, + "unit": "iter/sec", + "range": "stddev: 0.000004700157239333874", + "extra": "mean: 144.59331067418682 usec\nrounds: 2501" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_td_decorator", + "value": 5429.530281600182, + "unit": "iter/sec", + "range": "stddev: 0.00004521525144766291", + "extra": "mean: 184.177994805341 usec\nrounds: 4043" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed[True-True]", + "value": 937.2778943128045, + "unit": "iter/sec", + "range": "stddev: 0.000025437239918202086", + "extra": "mean: 1.0669194334655487 msec\nrounds: 759" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed[True-False]", + "value": 1577.1887209714698, + "unit": "iter/sec", + "range": "stddev: 0.000019427729925500887", + "extra": "mean: 634.0395329381063 usec\nrounds: 1518" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed[False-True]", + "value": 1033.6671269549588, + "unit": "iter/sec", + "range": "stddev: 0.000010308911687254855", + "extra": "mean: 967.4294305419796 usec\nrounds: 1015" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed[False-False]", + "value": 1780.0303962604662, + "unit": "iter/sec", + "range": "stddev: 0.000008307105482514186", + "extra": "mean: 561.7881594049326 usec\nrounds: 1744" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[True-True]", + "value": 410.92230126843884, + "unit": "iter/sec", + "range": "stddev: 0.00007144879164587662", + "extra": "mean: 2.4335500821279124 msec\nrounds: 414" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[True-False]", + "value": 1478.5134259260242, + "unit": "iter/sec", + "range": "stddev: 0.00004170301575786401", + "extra": "mean: 676.355035040469 usec\nrounds: 1484" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[False-True]", + "value": 488.77486404637534, + "unit": "iter/sec", + "range": "stddev: 0.0000739050476256088", + "extra": "mean: 2.0459317234961563 msec\nrounds: 434" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[False-False]", + "value": 1697.0301694497668, + "unit": "iter/sec", + "range": "stddev: 0.00003754665048609404", + "extra": "mean: 589.2647155025139 usec\nrounds: 1645" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed[True-True]", + "value": 84.23111670737116, + "unit": "iter/sec", + "range": "stddev: 0.00016467332034838245", + "extra": "mean: 11.87209714284233 msec\nrounds: 84" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed[True-False]", + "value": 127.20522171171383, + "unit": "iter/sec", + "range": "stddev: 0.00013095487358084248", + "extra": "mean: 7.861312503871168 msec\nrounds: 129" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed[False-True]", + "value": 85.42049751841112, + "unit": "iter/sec", + "range": "stddev: 0.0000496432000740668", + "extra": "mean: 11.706792035301184 msec\nrounds: 85" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed[False-False]", + "value": 129.74226549104026, + "unit": "iter/sec", + "range": "stddev: 0.00003423405237060706", + "extra": "mean: 7.707588550386905 msec\nrounds: 129" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed_decorator[True-True]", + "value": 13.79369476970213, + "unit": "iter/sec", + "range": "stddev: 0.00041844481535642324", + "extra": "mean: 72.49689199999564 msec\nrounds: 14" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed_decorator[True-False]", + "value": 53.762026621132904, + "unit": "iter/sec", + "range": "stddev: 0.0004038421842096363", + "extra": "mean: 18.60048928302338 msec\nrounds: 53" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed_decorator[False-True]", + "value": 15.264718724775543, + "unit": "iter/sec", + "range": "stddev: 0.0004827200383198114", + "extra": "mean: 65.51054218751773 msec\nrounds: 16" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed_decorator[False-False]", + "value": 49.99425929553982, + "unit": "iter/sec", + "range": "stddev: 0.012787158359703753", + "extra": "mean: 20.002296545459846 msec\nrounds: 55" + } + ] } ] }