From d097d50a421efb29a5dea54e87a4c3cc28f27fa3 Mon Sep 17 00:00:00 2001 From: github-action-benchmark Date: Thu, 12 Dec 2024 17:40:11 +0000 Subject: [PATCH] add GPU Benchmark Results (pytest) benchmark result for eb4a56ed687cf7f15e4182645f1c35e738231664 --- dev/bench/data.js | 1629 ++++++++++++++++++++++++++++++++++++++++++++- 1 file changed, 1628 insertions(+), 1 deletion(-) diff --git a/dev/bench/data.js b/dev/bench/data.js index bc48ef0ff..1c9d61b93 100644 --- a/dev/bench/data.js +++ b/dev/bench/data.js @@ -1,5 +1,5 @@ window.BENCHMARK_DATA = { - "lastUpdate": 1734025023585, + "lastUpdate": 1734025210829, "repoUrl": "https://github.com/pytorch/tensordict", "entries": { "CPU Benchmark Results": [ @@ -736364,6 +736364,1633 @@ window.BENCHMARK_DATA = { "extra": "mean: 51.2013188421059 msec\nrounds: 19" } ] + }, + { + "commit": { + "author": { + "email": "vmoens@meta.com", + "name": "Vincent Moens", + "username": "vmoens" + }, + "committer": { + "email": "vmoens@meta.com", + "name": "Vincent Moens", + "username": "vmoens" + }, + "distinct": true, + "id": "eb4a56ed687cf7f15e4182645f1c35e738231664", + "message": "[BugFix] Better comparison of tensorclasses\n\nghstack-source-id: 8def6f01f2b6d09714319a56f96b166ac1fd49d5\nPull Request resolved: https://github.com/pytorch/tensordict/pull/1137", + "timestamp": "2024-12-12T09:28:55-08:00", + "tree_id": "8def6f01f2b6d09714319a56f96b166ac1fd49d5", + "url": "https://github.com/pytorch/tensordict/commit/eb4a56ed687cf7f15e4182645f1c35e738231664" + }, + "date": 1734025178470, + "tool": "pytest", + "benches": [ + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_nested", + "value": 90848.36449169528, + "unit": "iter/sec", + "range": "stddev: 6.730365868976647e-7", + "extra": "mean: 11.00735280811151 usec\nrounds: 20161" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_stack_nested", + "value": 89697.762158992, + "unit": "iter/sec", + "range": "stddev: 5.765255610144883e-7", + "extra": "mean: 11.148550152538586 usec\nrounds: 23122" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_nested_inplace", + "value": 82816.34063145187, + "unit": "iter/sec", + "range": "stddev: 8.10722354978611e-7", + "extra": "mean: 12.074911694664053 usec\nrounds: 45370" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_plain_set_stack_nested_inplace", + "value": 83233.60982848532, + "unit": "iter/sec", + "range": "stddev: 7.213114728098676e-7", + "extra": "mean: 12.014377389862606 usec\nrounds: 52939" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items", + "value": 343650.8708547817, + "unit": "iter/sec", + "range": "stddev: 2.776609943181714e-7", + "extra": "mean: 2.9099300621955213 usec\nrounds: 97457" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_nested", + "value": 2893.9784050572293, + "unit": "iter/sec", + "range": "stddev: 0.000005376197845780773", + "extra": "mean: 345.54508017492435 usec\nrounds: 2619" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_nested_locked", + "value": 2881.9416441782805, + "unit": "iter/sec", + "range": "stddev: 0.000004983201573942779", + "extra": "mean: 346.98828896139116 usec\nrounds: 2799" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_nested_leaf", + "value": 17285.211257885116, + "unit": "iter/sec", + "range": "stddev: 0.0000016279332846690772", + "extra": "mean: 57.85292323481572 usec\nrounds: 12702" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_stack_nested", + "value": 2876.6384971338807, + "unit": "iter/sec", + "range": "stddev: 0.000005265191788027093", + "extra": "mean: 347.6279695889293 usec\nrounds: 2665" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_stack_nested_leaf", + "value": 16870.120045041902, + "unit": "iter/sec", + "range": "stddev: 0.000001832241398997544", + "extra": "mean: 59.276400958029825 usec\nrounds: 13501" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_items_stack_nested_locked", + "value": 2846.9195375132967, + "unit": "iter/sec", + "range": "stddev: 0.0000055138966160811105", + "extra": "mean: 351.25685388125567 usec\nrounds: 2785" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys", + "value": 287657.5187929735, + "unit": "iter/sec", + "range": "stddev: 3.189812578436954e-7", + "extra": "mean: 3.4763562037107674 usec\nrounds: 154560" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_nested", + "value": 14192.378864673577, + "unit": "iter/sec", + "range": "stddev: 0.0000019653416863459205", + "extra": "mean: 70.46035125859781 usec\nrounds: 9984" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_nested_locked", + "value": 13222.425933320765, + "unit": "iter/sec", + "range": "stddev: 0.000006808935471778719", + "extra": "mean: 75.62908690454307 usec\nrounds: 11921" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_nested_leaf", + "value": 16255.621312796642, + "unit": "iter/sec", + "range": "stddev: 0.0000017968576889356626", + "extra": "mean: 61.51718108816835 usec\nrounds: 9631" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_stack_nested", + "value": 14239.887623943128, + "unit": "iter/sec", + "range": "stddev: 0.0000020569438707520846", + "extra": "mean: 70.22527328927703 usec\nrounds: 12360" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_stack_nested_leaf", + "value": 16361.65286317423, + "unit": "iter/sec", + "range": "stddev: 0.0000022266847885208377", + "extra": "mean: 61.11851952627211 usec\nrounds: 13818" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_keys_stack_nested_locked", + "value": 13317.232937323442, + "unit": "iter/sec", + "range": "stddev: 0.0000025403223585040456", + "extra": "mean: 75.09067421936861 usec\nrounds: 12263" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values", + "value": 1185991.1970161698, + "unit": "iter/sec", + "range": "stddev: 5.935088359335268e-8", + "extra": "mean: 843.1765788109522 nsec\nrounds: 189359" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_nested", + "value": 31809.41021229369, + "unit": "iter/sec", + "range": "stddev: 0.000001124910373833511", + "extra": "mean: 31.43723801623711 usec\nrounds: 22763" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_nested_locked", + "value": 30282.24183940314, + "unit": "iter/sec", + "range": "stddev: 0.000002633219164054884", + "extra": "mean: 33.02265417809337 usec\nrounds: 26925" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_nested_leaf", + "value": 29797.70955836987, + "unit": "iter/sec", + "range": "stddev: 0.0000010863875377382929", + "extra": "mean: 33.559626388099694 usec\nrounds: 22124" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_stack_nested", + "value": 30787.00916825697, + "unit": "iter/sec", + "range": "stddev: 0.0000011319352980433423", + "extra": "mean: 32.481232409904 usec\nrounds: 23827" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_stack_nested_leaf", + "value": 28691.71989827214, + "unit": "iter/sec", + "range": "stddev: 0.000001174568492637438", + "extra": "mean: 34.85326092494795 usec\nrounds: 23883" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_values_stack_nested_locked", + "value": 29298.042831806215, + "unit": "iter/sec", + "range": "stddev: 0.0000012752349972818596", + "extra": "mean: 34.13197276489716 usec\nrounds: 26233" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership", + "value": 1783862.043292478, + "unit": "iter/sec", + "range": "stddev: 2.7997849664070242e-8", + "extra": "mean: 560.5814663528004 nsec\nrounds: 87413" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested", + "value": 495637.68607128813, + "unit": "iter/sec", + "range": "stddev: 3.0862377442754597e-7", + "extra": "mean: 2.0176028338897716 usec\nrounds: 197629" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested_leaf", + "value": 511255.56761797756, + "unit": "iter/sec", + "range": "stddev: 1.7149797156792155e-7", + "extra": "mean: 1.9559689191438283 usec\nrounds: 193424" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested", + "value": 474567.40587596217, + "unit": "iter/sec", + "range": "stddev: 2.84399500741569e-7", + "extra": "mean: 2.1071822203090163 usec\nrounds: 81901" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested_leaf", + "value": 485249.6248070941, + "unit": "iter/sec", + "range": "stddev: 2.592502669186534e-7", + "extra": "mean: 2.060794998857628 usec\nrounds: 142654" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested_last", + "value": 346473.4690209603, + "unit": "iter/sec", + "range": "stddev: 3.3136315278055025e-7", + "extra": "mean: 2.8862238797842954 usec\nrounds: 150603" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_nested_leaf_last", + "value": 343016.0473250236, + "unit": "iter/sec", + "range": "stddev: 3.0692241841899494e-7", + "extra": "mean: 2.915315501412835 usec\nrounds: 167505" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested_last", + "value": 127285.04251738776, + "unit": "iter/sec", + "range": "stddev: 5.809995989755761e-7", + "extra": "mean: 7.856382652843087 usec\nrounds: 39262" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_membership_stacked_nested_leaf_last", + "value": 126981.82559235435, + "unit": "iter/sec", + "range": "stddev: 5.167689590897718e-7", + "extra": "mean: 7.8751427248358175 usec\nrounds: 61687" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_getleaf", + "value": 163812.3659298786, + "unit": "iter/sec", + "range": "stddev: 4.286792387605892e-7", + "extra": "mean: 6.1045452479946425 usec\nrounds: 100797" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_get", + "value": 173031.12868866968, + "unit": "iter/sec", + "range": "stddev: 4.056287599779378e-7", + "extra": "mean: 5.779306923433838 usec\nrounds: 116823" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_getleaf", + "value": 164582.02500871662, + "unit": "iter/sec", + "range": "stddev: 4.3677089303080905e-7", + "extra": "mean: 6.075997667102697 usec\nrounds: 65964" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_get", + "value": 171877.54042938512, + "unit": "iter/sec", + "range": "stddev: 4.3374738882774376e-7", + "extra": "mean: 5.818095822768911 usec\nrounds: 87405" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_getitemleaf", + "value": 161291.02693366093, + "unit": "iter/sec", + "range": "stddev: 5.039688442741214e-7", + "extra": "mean: 6.1999729247883115 usec\nrounds: 66402" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_nested_getitem", + "value": 170557.27547505862, + "unit": "iter/sec", + "range": "stddev: 5.289762954378317e-7", + "extra": "mean: 5.863133057295081 usec\nrounds: 100402" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_getitemleaf", + "value": 160900.4905853959, + "unit": "iter/sec", + "range": "stddev: 5.244006859909791e-7", + "extra": "mean: 6.215021448112135 usec\nrounds: 59666" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_stacked_getitem", + "value": 170518.50623845085, + "unit": "iter/sec", + "range": "stddev: 4.83965716824648e-7", + "extra": "mean: 5.864466104351237 usec\nrounds: 82441" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_lock_nested", + "value": 2743.0893854759297, + "unit": "iter/sec", + "range": "stddev: 0.0002802111867281729", + "extra": "mean: 364.552466024179 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_lock_stack_nested", + "value": 3082.735655936109, + "unit": "iter/sec", + "range": "stddev: 0.000009869042007387711", + "extra": "mean: 324.38720396748977 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unlock_nested", + "value": 3354.1756439628425, + "unit": "iter/sec", + "range": "stddev: 0.00006095994961198411", + "extra": "mean: 298.13584801377147 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unlock_stack_nested", + "value": 3778.951558003569, + "unit": "iter/sec", + "range": "stddev: 0.000009955052565031484", + "extra": "mean: 264.62366205305443 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_flatten_speed", + "value": 13364.292315286712, + "unit": "iter/sec", + "range": "stddev: 0.0000032267229917372406", + "extra": "mean: 74.82625913952454 usec\nrounds: 8999" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unflatten_speed", + "value": 3278.4825577821907, + "unit": "iter/sec", + "range": "stddev: 0.000005242369620988693", + "extra": "mean: 305.01916126602003 usec\nrounds: 3013" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_common_ops", + "value": 1686.900093755517, + "unit": "iter/sec", + "range": "stddev: 0.00013112101800029125", + "extra": "mean: 592.8033341759541 usec\nrounds: 1245" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation", + "value": 674971.9962944133, + "unit": "iter/sec", + "range": "stddev: 3.8793119873351837e-7", + "extra": "mean: 1.4815429462110812 usec\nrounds: 168068" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation_empty", + "value": 120899.41642880421, + "unit": "iter/sec", + "range": "stddev: 0.000009300120173034124", + "extra": "mean: 8.271338518733748 usec\nrounds: 28217" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation_nested_1", + "value": 99976.00431467133, + "unit": "iter/sec", + "range": "stddev: 6.83354261045346e-7", + "extra": "mean: 10.00240014446398 usec\nrounds: 36139" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_creation_nested_2", + "value": 80526.19881063265, + "unit": "iter/sec", + "range": "stddev: 7.143836279691812e-7", + "extra": "mean: 12.418318693418327 usec\nrounds: 33511" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_clone", + "value": 99523.62035882038, + "unit": "iter/sec", + "range": "stddev: 6.946119975959607e-7", + "extra": "mean: 10.047865987939556 usec\nrounds: 17819" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[int]", + "value": 94783.1609053331, + "unit": "iter/sec", + "range": "stddev: 0.000012017627850243833", + "extra": "mean: 10.550397248291532 usec\nrounds: 14588" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[slice_int]", + "value": 50353.81933355456, + "unit": "iter/sec", + "range": "stddev: 0.000006828512700186184", + "extra": "mean: 19.859466734306377 usec\nrounds: 10668" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[range]", + "value": 27699.458034564585, + "unit": "iter/sec", + "range": "stddev: 0.000008052144853465404", + "extra": "mean: 36.10178938346579 usec\nrounds: 5977" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[tuple]", + "value": 57007.88153277871, + "unit": "iter/sec", + "range": "stddev: 0.000006639794266712505", + "extra": "mean: 17.54143415108338 usec\nrounds: 25484" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_getitem[list]", + "value": 31738.78189654022, + "unit": "iter/sec", + "range": "stddev: 0.000008449558402672314", + "extra": "mean: 31.507195306351942 usec\nrounds: 13809" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[int]", + "value": 55108.080756263495, + "unit": "iter/sec", + "range": "stddev: 0.000002148813338109569", + "extra": "mean: 18.146159080060897 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[slice_int]", + "value": 26872.401071427408, + "unit": "iter/sec", + "range": "stddev: 0.0000028990564204223177", + "extra": "mean: 37.212900973827345 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[range]", + "value": 19563.85973781249, + "unit": "iter/sec", + "range": "stddev: 0.000002921633821288745", + "extra": "mean: 51.11465801746817 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem_dim[tuple]", + "value": 32219.67945313913, + "unit": "iter/sec", + "range": "stddev: 0.0000017361723832960912", + "extra": "mean: 31.036931992275637 usec\nrounds: 1000" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_setitem", + "value": 69329.36108061673, + "unit": "iter/sec", + "range": "stddev: 0.0000015790715485923678", + "extra": "mean: 14.423903298880719 usec\nrounds: 25866" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set", + "value": 71675.6141486197, + "unit": "iter/sec", + "range": "stddev: 0.0000018100032933244772", + "extra": "mean: 13.95174651627673 usec\nrounds: 27330" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set_shared", + "value": 6768.136396797364, + "unit": "iter/sec", + "range": "stddev: 0.00014553569419283955", + "extra": "mean: 147.75115945848745 usec\nrounds: 4215" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_update", + "value": 58716.39240223086, + "unit": "iter/sec", + "range": "stddev: 0.000006407442341260111", + "extra": "mean: 17.031019091731633 usec\nrounds: 32310" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_update_nested", + "value": 44999.076821530325, + "unit": "iter/sec", + "range": "stddev: 0.0000020245746561600664", + "extra": "mean: 22.222678122177353 usec\nrounds: 25330" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_update__nested", + "value": 42950.16710970375, + "unit": "iter/sec", + "range": "stddev: 0.000002065655503295535", + "extra": "mean: 23.282796489377795 usec\nrounds: 9272" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set_nested", + "value": 65867.78436636933, + "unit": "iter/sec", + "range": "stddev: 0.0000017656026387852348", + "extra": "mean: 15.181928610772863 usec\nrounds: 25019" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_set_nested_new", + "value": 55757.9115197739, + "unit": "iter/sec", + "range": "stddev: 0.0000019589927713597073", + "extra": "mean: 17.934674609276954 usec\nrounds: 23068" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_select", + "value": 34717.67778072766, + "unit": "iter/sec", + "range": "stddev: 0.0000028601684328778086", + "extra": "mean: 28.803769834948927 usec\nrounds: 13680" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_select_nested", + "value": 24002.4014737869, + "unit": "iter/sec", + "range": "stddev: 0.000001455402895868657", + "extra": "mean: 41.662497858479 usec\nrounds: 16600" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_exclude_nested", + "value": 16937.617934257174, + "unit": "iter/sec", + "range": "stddev: 0.0000017794398935254493", + "extra": "mean: 59.040179314556994 usec\nrounds: 11929" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_empty[True]", + "value": 3750.7269645727165, + "unit": "iter/sec", + "range": "stddev: 0.000004081811633786086", + "extra": "mean: 266.6149814277191 usec\nrounds: 3232" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_empty[False]", + "value": 1235370.3040683493, + "unit": "iter/sec", + "range": "stddev: 4.381313348959921e-8", + "extra": "mean: 809.4738854469607 nsec\nrounds: 115341" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_to", + "value": 18504.028535364927, + "unit": "iter/sec", + "range": "stddev: 0.000014179245361419654", + "extra": "mean: 54.04228587784539 usec\nrounds: 7" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_to_nonblocking", + "value": 22617.392616601912, + "unit": "iter/sec", + "range": "stddev: 0.000002048762960582614", + "extra": "mean: 44.213761371678494 usec\nrounds: 11415" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unbind_speed", + "value": 4396.017344589423, + "unit": "iter/sec", + "range": "stddev: 0.000004118065245198175", + "extra": "mean: 227.4786293167816 usec\nrounds: 920" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unbind_speed_stack0", + "value": 4467.46164156062, + "unit": "iter/sec", + "range": "stddev: 0.000004183779631140832", + "extra": "mean: 223.84075795906995 usec\nrounds: 3557" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_unbind_speed_stack1", + "value": 1710.5504298170033, + "unit": "iter/sec", + "range": "stddev: 0.000008772333745973442", + "extra": "mean: 584.6071431562418 usec\nrounds: 468" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_split", + "value": 645.4816044945027, + "unit": "iter/sec", + "range": "stddev: 0.003612452952499744", + "extra": "mean: 1.549230827086284 msec\nrounds: 677" + }, + { + "name": "benchmarks/common/common_ops_test.py::test_chunk", + "value": 646.17262799964, + "unit": "iter/sec", + "range": "stddev: 0.0035516358910782746", + "extra": "mean: 1.5475740640635078 msec\nrounds: 687" + }, + { + "name": "benchmarks/common/h2d_test.py::TestConsolidate::test_consolidate[False-None]", + "value": 360.9056185878469, + "unit": "iter/sec", + "range": "stddev: 0.004859357127290775", + "extra": "mean: 2.770807514476512 msec\nrounds: 379" + }, + { + "name": "benchmarks/common/h2d_test.py::TestConsolidate::test_consolidate[default-None]", + "value": 616.5727842666379, + "unit": "iter/sec", + "range": "stddev: 0.000014508284826302606", + "extra": "mean: 1.6218685376932702 msec\nrounds: 584" + }, + { + "name": "benchmarks/common/h2d_test.py::TestConsolidate::test_consolidate[reduce-overhead-None]", + "value": 597.2791112444644, + "unit": "iter/sec", + "range": "stddev: 0.00001375261232518173", + "extra": "mean: 1.6742591213619444 msec\nrounds: 577" + }, + { + "name": "benchmarks/common/h2d_test.py::TestConsolidate::test_consolidate_njt[False-None]", + "value": 158.52850527712934, + "unit": "iter/sec", + "range": "stddev: 0.00010912465723596976", + "extra": "mean: 6.308013806424682 msec\nrounds: 155" + }, + { + "name": "benchmarks/common/h2d_test.py::TestTo::test_to[False-False-None]", + "value": 604.6498007892108, + "unit": "iter/sec", + "range": "stddev: 0.000013548414478072972", + "extra": "mean: 1.6538498792106835 msec\nrounds: 604" + }, + { + "name": "benchmarks/common/h2d_test.py::TestTo::test_to[True-False-None]", + "value": 804.7730391659667, + "unit": "iter/sec", + "range": "stddev: 0.000022081883560454528", + "extra": "mean: 1.2425863583058878 msec\nrounds: 801" + }, + { + "name": "benchmarks/common/h2d_test.py::TestTo::test_to[within-False-None]", + "value": 258.8021641264811, + "unit": "iter/sec", + "range": "stddev: 0.00004685898063383173", + "extra": "mean: 3.86395532423478 msec\nrounds: 256" + }, + { + "name": "benchmarks/common/h2d_test.py::TestTo::test_to[True-default-None]", + "value": 200.8896094515423, + "unit": "iter/sec", + "range": "stddev: 0.00010326982468792573", + "extra": "mean: 4.977858251256223 msec\nrounds: 195" + }, + { + "name": "benchmarks/common/h2d_test.py::TestTo::test_to_njt[False-False-None]", + "value": 147.2887490143131, + "unit": "iter/sec", + "range": "stddev: 0.00008418427724181626", + "extra": "mean: 6.789384842306066 msec\nrounds: 146" + }, + { + "name": "benchmarks/common/h2d_test.py::TestTo::test_to_njt[True-False-None]", + "value": 187.4629263736591, + "unit": "iter/sec", + "range": "stddev: 0.00008838083012382305", + "extra": "mean: 5.334388080589106 msec\nrounds: 186" + }, + { + "name": "benchmarks/common/h2d_test.py::TestTo::test_to_njt[within-False-None]", + "value": 84.40778560739543, + "unit": "iter/sec", + "range": "stddev: 0.00010402771639136946", + "extra": "mean: 11.847248364638826 msec\nrounds: 85" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_creation[device0]", + "value": 12462.013748056177, + "unit": "iter/sec", + "range": "stddev: 0.000013530278981794842", + "extra": "mean: 80.24385305753492 usec\nrounds: 2899" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_creation_from_tensor", + "value": 12275.729906142542, + "unit": "iter/sec", + "range": "stddev: 0.000015466177178060347", + "extra": "mean: 81.46155117828219 usec\nrounds: 7241" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_add_one[memmap_tensor0]", + "value": 155675.95897659744, + "unit": "iter/sec", + "range": "stddev: 0.0000031214532129245705", + "extra": "mean: 6.423599421348859 usec\nrounds: 25974" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_contiguous[memmap_tensor0]", + "value": 2527721.724954064, + "unit": "iter/sec", + "range": "stddev: 1.815993592176078e-7", + "extra": "mean: 395.6131682249053 nsec\nrounds: 120049" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_stack[memmap_tensor0]", + "value": 240295.9598041904, + "unit": "iter/sec", + "range": "stddev: 4.990644363641968e-7", + "extra": "mean: 4.1615348040594125 usec\nrounds: 23305" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_memmaptd_index", + "value": 4162.841681928305, + "unit": "iter/sec", + "range": "stddev: 0.00006156062355687913", + "extra": "mean: 240.220521558913 usec\nrounds: 2063" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_memmaptd_index_astensor", + "value": 3370.322362125645, + "unit": "iter/sec", + "range": "stddev: 0.00006377705503050839", + "extra": "mean: 296.70752306592567 usec\nrounds: 3208" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_memmaptd_index_op", + "value": 1774.2617922919176, + "unit": "iter/sec", + "range": "stddev: 0.00006940321188753397", + "extra": "mean: 563.6146843404894 usec\nrounds: 1698" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_serialize_model", + "value": 7.664120799393542, + "unit": "iter/sec", + "range": "stddev: 0.0007348188253250729", + "extra": "mean: 130.47811042841724 msec\nrounds: 7" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_serialize_model_pickle", + "value": 0.8251490998934677, + "unit": "iter/sec", + "range": "stddev: 0.32586946617817436", + "extra": "mean: 1.2119021885003651 sec\nrounds: 6" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_serialize_weights", + "value": 7.667260865865399, + "unit": "iter/sec", + "range": "stddev: 0.0009408717665713112", + "extra": "mean: 130.42467414301686 msec\nrounds: 7" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_serialize_weights_returnearly", + "value": 24.052894174035472, + "unit": "iter/sec", + "range": "stddev: 0.004107013701484695", + "extra": "mean: 41.57503844503986 msec\nrounds: 27" + }, + { + "name": "benchmarks/common/memmap_benchmarks_test.py::test_serialize_weights_pickle", + "value": 0.8200734271339326, + "unit": "iter/sec", + "range": "stddev: 0.31830197626884016", + "extra": "mean: 1.2194030033321421 sec\nrounds: 6" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_reshape_pytree", + "value": 45070.74729667241, + "unit": "iter/sec", + "range": "stddev: 0.0000011214098322859942", + "extra": "mean: 22.187340125905354 usec\nrounds: 12777" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_reshape_td", + "value": 38119.34102087772, + "unit": "iter/sec", + "range": "stddev: 0.0000012185511283225603", + "extra": "mean: 26.233402079335693 usec\nrounds: 9538" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_view_pytree", + "value": 45856.232425387745, + "unit": "iter/sec", + "range": "stddev: 0.0000010515351255006118", + "extra": "mean: 21.807286536832063 usec\nrounds: 23202" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_view_td", + "value": 34450.15269439509, + "unit": "iter/sec", + "range": "stddev: 0.0000014205779750232337", + "extra": "mean: 29.027447537633012 usec\nrounds: 15127" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_unbind_pytree", + "value": 35900.93449728897, + "unit": "iter/sec", + "range": "stddev: 0.000001352554579685832", + "extra": "mean: 27.854428136836223 usec\nrounds: 14510" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_unbind_td", + "value": 28416.77124965158, + "unit": "iter/sec", + "range": "stddev: 0.000005253799038015723", + "extra": "mean: 35.19048632283518 usec\nrounds: 15572" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_split_pytree", + "value": 33570.051860448315, + "unit": "iter/sec", + "range": "stddev: 0.000001492669870756856", + "extra": "mean: 29.78845561981939 usec\nrounds: 13897" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_split_td", + "value": 26502.84605531591, + "unit": "iter/sec", + "range": "stddev: 0.00001463775388772617", + "extra": "mean: 37.73179672525853 usec\nrounds: 13013" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_add_pytree", + "value": 29905.54858911461, + "unit": "iter/sec", + "range": "stddev: 0.000001671299200366585", + "extra": "mean: 33.43861079893355 usec\nrounds: 10428" + }, + { + "name": "benchmarks/common/pytree_benchmarks_test.py::test_add_td", + "value": 22776.30405877428, + "unit": "iter/sec", + "range": "stddev: 0.0000022757583907315755", + "extra": "mean: 43.90527968978192 usec\nrounds: 9654" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_nested[tensordict-compile]", + "value": 8284.697503711086, + "unit": "iter/sec", + "range": "stddev: 0.000004307771017617054", + "extra": "mean: 120.70446742950547 usec\nrounds: 2381" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_nested[tensordict-eager]", + "value": 8131.166776835762, + "unit": "iter/sec", + "range": "stddev: 0.000003922658358563878", + "extra": "mean: 122.98358002554085 usec\nrounds: 7223" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_nested[pytree-compile]", + "value": 10582.038582129977, + "unit": "iter/sec", + "range": "stddev: 0.0000033276683765250427", + "extra": "mean: 94.49974995259541 usec\nrounds: 3175" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_nested[pytree-eager]", + "value": 6840.181960871412, + "unit": "iter/sec", + "range": "stddev: 0.000009374456814923927", + "extra": "mean: 146.1949412633175 usec\nrounds: 6266" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_copy_nested[tensordict-compile]", + "value": 43700.90902779176, + "unit": "iter/sec", + "range": "stddev: 0.000001381979790749592", + "extra": "mean: 22.882819196370637 usec\nrounds: 31929" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_copy_nested[tensordict-eager]", + "value": 37287.147992884195, + "unit": "iter/sec", + "range": "stddev: 0.0000011676387854180538", + "extra": "mean: 26.81889213384832 usec\nrounds: 31857" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_copy_nested[pytree-compile]", + "value": 15576.89880653467, + "unit": "iter/sec", + "range": "stddev: 0.0000022031377905304834", + "extra": "mean: 64.19763089046259 usec\nrounds: 10731" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_copy_nested[pytree-eager]", + "value": 20320.09127060297, + "unit": "iter/sec", + "range": "stddev: 0.000001616184177763492", + "extra": "mean: 49.21237737975605 usec\nrounds: 17569" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_flat[tensordict-compile]", + "value": 7042.527924602868, + "unit": "iter/sec", + "range": "stddev: 0.000004268556690584341", + "extra": "mean: 141.99446714389717 usec\nrounds: 1706" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_flat[tensordict-eager]", + "value": 4932.219412828109, + "unit": "iter/sec", + "range": "stddev: 0.000004367121672991417", + "extra": "mean: 202.74848223481712 usec\nrounds: 4753" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_flat[tensorclass-compile]", + "value": 10433.37523091158, + "unit": "iter/sec", + "range": "stddev: 0.0000033341813769166192", + "extra": "mean: 95.84626047352735 usec\nrounds: 3494" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_flat[tensorclass-eager]", + "value": 19977.841098005072, + "unit": "iter/sec", + "range": "stddev: 0.000002450100710992213", + "extra": "mean: 50.055458700182434 usec\nrounds: 16647" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_flat[pytree-compile]", + "value": 7435.699271471523, + "unit": "iter/sec", + "range": "stddev: 0.0000037151454741766214", + "extra": "mean: 134.48634264119454 usec\nrounds: 1763" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_one_flat[pytree-eager]", + "value": 2149.5001264478415, + "unit": "iter/sec", + "range": "stddev: 0.0000070327049739750405", + "extra": "mean: 465.22444343957824 usec\nrounds: 2093" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_self_flat[tensordict-eager]", + "value": 4105.510295594302, + "unit": "iter/sec", + "range": "stddev: 0.000005946496026078204", + "extra": "mean: 243.57508031903325 usec\nrounds: 3873" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_self_flat[tensordict-compile]", + "value": 7140.883406562312, + "unit": "iter/sec", + "range": "stddev: 0.000004154226636075559", + "extra": "mean: 140.03869592395563 usec\nrounds: 1720" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_self_flat[tensorclass-eager]", + "value": 16524.71841875902, + "unit": "iter/sec", + "range": "stddev: 0.0000026423741222881596", + "extra": "mean: 60.515403328433734 usec\nrounds: 13523" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_self_flat[tensorclass-compile]", + "value": 10435.346142112468, + "unit": "iter/sec", + "range": "stddev: 0.000003608945855843771", + "extra": "mean: 95.8281581062692 usec\nrounds: 3371" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_self_flat[pytree-eager]", + "value": 2532.8722261371254, + "unit": "iter/sec", + "range": "stddev: 0.00000582099641705635", + "extra": "mean: 394.8087036056677 usec\nrounds: 2500" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_add_self_flat[pytree-compile]", + "value": 7513.499079168104, + "unit": "iter/sec", + "range": "stddev: 0.000004310277604091702", + "extra": "mean: 133.09378086870282 usec\nrounds: 1839" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_copy_flat[tensordict-compile]", + "value": 54513.919579176196, + "unit": "iter/sec", + "range": "stddev: 0.0000011947313675926555", + "extra": "mean: 18.343938717295803 usec\nrounds: 36192" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_copy_flat[tensordict-eager]", + "value": 37352.308526190274, + "unit": "iter/sec", + "range": "stddev: 0.0000010856680404051866", + "extra": "mean: 26.772106985002846 usec\nrounds: 33378" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_copy_flat[pytree-compile]", + "value": 14485.872746197181, + "unit": "iter/sec", + "range": "stddev: 0.000002154853288059432", + "extra": "mean: 69.03277541648426 usec\nrounds: 13362" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_copy_flat[pytree-eager]", + "value": 19608.652009477766, + "unit": "iter/sec", + "range": "stddev: 0.0000016348905651813466", + "extra": "mean: 50.99789621013488 usec\nrounds: 17526" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_assign_and_add[tensordict-compile]", + "value": 2274.5127619788573, + "unit": "iter/sec", + "range": "stddev: 0.0006554244958825935", + "extra": "mean: 439.6546006319113 usec\nrounds: 5" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_assign_and_add[tensordict-eager]", + "value": 385.5384696440321, + "unit": "iter/sec", + "range": "stddev: 0.00002973572367775201", + "extra": "mean: 2.5937748856120653 msec\nrounds: 376" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_assign_and_add[pytree-compile]", + "value": 2309.2618946480457, + "unit": "iter/sec", + "range": "stddev: 0.0006519307063051396", + "extra": "mean: 433.03880011080764 usec\nrounds: 5" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_assign_and_add[pytree-eager]", + "value": 384.60747291963173, + "unit": "iter/sec", + "range": "stddev: 0.000022995371224398395", + "extra": "mean: 2.6000534841634804 msec\nrounds: 378" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[tensor-tensordict-compile]", + "value": 8934.190569465673, + "unit": "iter/sec", + "range": "stddev: 0.000005463570024814525", + "extra": "mean: 111.92955782896482 usec\nrounds: 7710" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[tensor-tensordict-eager]", + "value": 12824.873979141223, + "unit": "iter/sec", + "range": "stddev: 0.000013158626047977655", + "extra": "mean: 77.97347573367438 usec\nrounds: 11347" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[tensor-tensorclass-compile]", + "value": 9768.687975665245, + "unit": "iter/sec", + "range": "stddev: 0.000005171560232750016", + "extra": "mean: 102.36789244278224 usec\nrounds: 8655" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[tensor-tensorclass-eager]", + "value": 14668.366831793353, + "unit": "iter/sec", + "range": "stddev: 0.0000033272047600321555", + "extra": "mean: 68.17391543771066 usec\nrounds: 13174" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[tensor-pytree-compile]", + "value": 9275.874482846499, + "unit": "iter/sec", + "range": "stddev: 0.0000041321847943907834", + "extra": "mean: 107.80654717237277 usec\nrounds: 8942" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[tensor-pytree-eager]", + "value": 14926.190177231294, + "unit": "iter/sec", + "range": "stddev: 0.0000028404526490997553", + "extra": "mean: 66.99633249517481 usec\nrounds: 12842" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[slice-tensordict-compile]", + "value": 10149.166348680274, + "unit": "iter/sec", + "range": "stddev: 0.0000031797800859569017", + "extra": "mean: 98.53026008683294 usec\nrounds: 3980" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[slice-tensordict-eager]", + "value": 58140.69092987962, + "unit": "iter/sec", + "range": "stddev: 0.000008753979925863043", + "extra": "mean: 17.199658002104698 usec\nrounds: 43384" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[slice-tensorclass-compile]", + "value": 10573.513994291507, + "unit": "iter/sec", + "range": "stddev: 0.000004218111239578436", + "extra": "mean: 94.57593762488857 usec\nrounds: 4249" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[slice-tensorclass-eager]", + "value": 64727.85771574291, + "unit": "iter/sec", + "range": "stddev: 9.705754430059102e-7", + "extra": "mean: 15.44929857545375 usec\nrounds: 46577" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[slice-pytree-compile]", + "value": 10597.446435097718, + "unit": "iter/sec", + "range": "stddev: 0.00000332461726063794", + "extra": "mean: 94.36235475445261 usec\nrounds: 9406" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[slice-pytree-eager]", + "value": 65699.59453526152, + "unit": "iter/sec", + "range": "stddev: 0.0000010245448288297703", + "extra": "mean: 15.220794086686361 usec\nrounds: 49237" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[int-tensordict-compile]", + "value": 10028.577841245818, + "unit": "iter/sec", + "range": "stddev: 0.000003403860362386267", + "extra": "mean: 99.71503595327064 usec\nrounds: 9096" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[int-tensordict-eager]", + "value": 59571.083243354515, + "unit": "iter/sec", + "range": "stddev: 0.000008907859374762302", + "extra": "mean: 16.786668053607293 usec\nrounds: 47170" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[int-tensorclass-compile]", + "value": 10582.046692276463, + "unit": "iter/sec", + "range": "stddev: 0.0000033317913113526494", + "extra": "mean: 94.49967752739853 usec\nrounds: 9312" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[int-tensorclass-eager]", + "value": 65250.524345294754, + "unit": "iter/sec", + "range": "stddev: 0.0000012935772549741667", + "extra": "mean: 15.32554734285611 usec\nrounds: 50710" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[int-pytree-compile]", + "value": 10561.052041508534, + "unit": "iter/sec", + "range": "stddev: 0.0000036543254614532294", + "extra": "mean: 94.68753643762564 usec\nrounds: 9569" + }, + { + "name": "benchmarks/compile/compile_td_test.py::test_compile_indexing[int-pytree-eager]", + "value": 66351.80059959929, + "unit": "iter/sec", + "range": "stddev: 9.668819742542283e-7", + "extra": "mean: 15.071181052561204 usec\nrounds: 49068" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_mod_add[eager]", + "value": 27840.491797417155, + "unit": "iter/sec", + "range": "stddev: 0.000001956308233287679", + "extra": "mean: 35.9189057174907 usec\nrounds: 19535" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_mod_add[compile]", + "value": 11845.486501872501, + "unit": "iter/sec", + "range": "stddev: 0.000004253187020134827", + "extra": "mean: 84.42034017276731 usec\nrounds: 7811" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_mod_add[compile-overhead]", + "value": 5538.791450279951, + "unit": "iter/sec", + "range": "stddev: 0.0000795421292559809", + "extra": "mean: 180.54480096907355 usec\nrounds: 5" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_mod_wrap[eager]", + "value": 4127.74716311318, + "unit": "iter/sec", + "range": "stddev: 0.00000672587681077494", + "extra": "mean: 242.26290043545012 usec\nrounds: 3725" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_mod_wrap[compile]", + "value": 3577.4398652619293, + "unit": "iter/sec", + "range": "stddev: 0.00002156134248049013", + "extra": "mean: 279.5295064804068 usec\nrounds: 2928" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_mod_wrap[compile-overhead]", + "value": 261.3152254746158, + "unit": "iter/sec", + "range": "stddev: 0.001791303631589329", + "extra": "mean: 3.826795771979005 msec\nrounds: 1311" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_mod_wrap_and_backward[eager]", + "value": 744.5941211610199, + "unit": "iter/sec", + "range": "stddev: 0.000020447355608933202", + "extra": "mean: 1.3430135580989204 msec\nrounds: 722" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_mod_wrap_and_backward[compile]", + "value": 797.4471401242463, + "unit": "iter/sec", + "range": "stddev: 0.00002162368332248578", + "extra": "mean: 1.2540016130024556 msec\nrounds: 571" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_mod_wrap_and_backward[compile-overhead]", + "value": 1001.1459112155761, + "unit": "iter/sec", + "range": "stddev: 0.00023230376142026476", + "extra": "mean: 998.8554003939498 usec\nrounds: 5" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_seq_add[eager]", + "value": 9194.01331916701, + "unit": "iter/sec", + "range": "stddev: 0.000003844970377613222", + "extra": "mean: 108.76642933671553 usec\nrounds: 8005" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_seq_add[compile]", + "value": 10883.284188230611, + "unit": "iter/sec", + "range": "stddev: 0.000004106679058753933", + "extra": "mean: 91.88402900306681 usec\nrounds: 9311" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_seq_add[compile-overhead]", + "value": 8011.511223376698, + "unit": "iter/sec", + "range": "stddev: 0.0000037880326919224736", + "extra": "mean: 124.820395568081 usec\nrounds: 3064" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_seq_wrap[eager]", + "value": 2433.9216831907133, + "unit": "iter/sec", + "range": "stddev: 0.000008066050350223503", + "extra": "mean: 410.8595633566422 usec\nrounds: 2265" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_seq_wrap[compile]", + "value": 3373.2045278194837, + "unit": "iter/sec", + "range": "stddev: 0.000005705720144287872", + "extra": "mean: 296.45400738461086 usec\nrounds: 3143" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_seq_wrap[compile-overhead]", + "value": 4522.4504548450295, + "unit": "iter/sec", + "range": "stddev: 0.000005163164283719853", + "extra": "mean: 221.11906144348612 usec\nrounds: 2083" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_runtime[False-eager]", + "value": 1379.5855694364302, + "unit": "iter/sec", + "range": "stddev: 0.00001108640496637255", + "extra": "mean: 724.8553639253465 usec\nrounds: 1341" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_runtime[False-compile]", + "value": 1369.8937050607688, + "unit": "iter/sec", + "range": "stddev: 0.000012311773622545497", + "extra": "mean: 729.9836449395466 usec\nrounds: 1315" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_runtime[False-compile-overhead]", + "value": 2849.2064164040617, + "unit": "iter/sec", + "range": "stddev: 0.000006639413598293264", + "extra": "mean: 350.9749220844744 usec\nrounds: 1450" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_runtime[True-eager]", + "value": 1136.6915095330603, + "unit": "iter/sec", + "range": "stddev: 0.000012859281512673915", + "extra": "mean: 879.7461682552625 usec\nrounds: 1129" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_runtime[True-compile]", + "value": 1335.0744557130645, + "unit": "iter/sec", + "range": "stddev: 0.000011086662669218268", + "extra": "mean: 749.0218959105911 usec\nrounds: 1278" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_runtime[True-compile-overhead]", + "value": 2682.8205764044105, + "unit": "iter/sec", + "range": "stddev: 0.000007021213585607068", + "extra": "mean: 372.74203455686455 usec\nrounds: 1332" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_cm_runtime[False-eager]", + "value": 1394.9400473852688, + "unit": "iter/sec", + "range": "stddev: 0.000012673334754723853", + "extra": "mean: 716.876687191281 usec\nrounds: 1365" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_cm_runtime[False-compile]", + "value": 1369.0745741926862, + "unit": "iter/sec", + "range": "stddev: 0.000011288977455047147", + "extra": "mean: 730.4204013792881 usec\nrounds: 1313" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_cm_runtime[False-compile-overhead]", + "value": 2732.2053337557904, + "unit": "iter/sec", + "range": "stddev: 0.000009338009432384208", + "extra": "mean: 366.0047023718247 usec\nrounds: 1401" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_cm_runtime[True-eager]", + "value": 1016.7147594449032, + "unit": "iter/sec", + "range": "stddev: 0.000022336963384530547", + "extra": "mean: 983.5600306874379 usec\nrounds: 976" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_cm_runtime[True-compile]", + "value": 1286.607939709884, + "unit": "iter/sec", + "range": "stddev: 0.000011966200575708427", + "extra": "mean: 777.2375477688169 usec\nrounds: 1225" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_func_call_cm_runtime[True-compile-overhead]", + "value": 2503.660358709031, + "unit": "iter/sec", + "range": "stddev: 0.000007097021806692011", + "extra": "mean: 399.41519883936365 usec\nrounds: 1287" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_vmap_func_call_cm_runtime[eager]", + "value": 486.631384526539, + "unit": "iter/sec", + "range": "stddev: 0.0000762738886714152", + "extra": "mean: 2.0549434989133215 msec\nrounds: 475" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_vmap_func_call_cm_runtime[compile]", + "value": 1259.6507299418554, + "unit": "iter/sec", + "range": "stddev: 0.000011557454362567655", + "extra": "mean: 793.8708534278857 usec\nrounds: 1228" + }, + { + "name": "benchmarks/compile/tensordict_nn_test.py::test_vmap_func_call_cm_runtime[compile-overhead]", + "value": 2489.1147153933366, + "unit": "iter/sec", + "range": "stddev: 0.000006939683511525165", + "extra": "mean: 401.74926202305517 usec\nrounds: 1206" + }, + { + "name": "benchmarks/distributed/distributed_benchmark_test.py::test_distributed", + "value": 8590.123255954055, + "unit": "iter/sec", + "range": "stddev: 0.00007465190130020435", + "extra": "mean: 116.41276500973045 usec\nrounds: 4060" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdmodule", + "value": 51065.45523810768, + "unit": "iter/sec", + "range": "stddev: 0.000020119100191295783", + "extra": "mean: 19.58270998147782 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdmodule_dispatch", + "value": 28904.617046010004, + "unit": "iter/sec", + "range": "stddev: 0.0000015951118244076294", + "extra": "mean: 34.59654900143505 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdseq", + "value": 52602.0995416812, + "unit": "iter/sec", + "range": "stddev: 9.022521209569831e-7", + "extra": "mean: 19.010648029507138 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_tdseq_dispatch", + "value": 27541.43553071735, + "unit": "iter/sec", + "range": "stddev: 0.000001540375688652065", + "extra": "mean: 36.308928010839736 usec\nrounds: 1000" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_instantiation_functorch", + "value": 675.0621480236714, + "unit": "iter/sec", + "range": "stddev: 0.000026129390843036256", + "extra": "mean: 1.4813450923409415 msec\nrounds: 585" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_functorch", + "value": 7138.7812748903, + "unit": "iter/sec", + "range": "stddev: 0.0000037754330986789108", + "extra": "mean: 140.07993262342484 usec\nrounds: 3650" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_functional_call", + "value": 7609.426299264, + "unit": "iter/sec", + "range": "stddev: 0.000004347834667362414", + "extra": "mean: 131.41595183026112 usec\nrounds: 5292" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_exec_td_decorator", + "value": 5626.679884229375, + "unit": "iter/sec", + "range": "stddev: 0.000008003706503008494", + "extra": "mean: 177.72470099157934 usec\nrounds: 4007" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[True-True]", + "value": 1480.9651544018634, + "unit": "iter/sec", + "range": "stddev: 0.00001285861189295839", + "extra": "mean: 675.2353335442812 usec\nrounds: 1400" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[True-False]", + "value": 1488.3711223856517, + "unit": "iter/sec", + "range": "stddev: 0.000012912097834789523", + "extra": "mean: 671.8754381616455 usec\nrounds: 1456" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[False-True]", + "value": 1712.032959215743, + "unit": "iter/sec", + "range": "stddev: 0.000011715922622640583", + "extra": "mean: 584.1009044931502 usec\nrounds: 1686" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_mlp_speed_decorator[False-False]", + "value": 1705.0194016937364, + "unit": "iter/sec", + "range": "stddev: 0.00001200022823522155", + "extra": "mean: 586.5035899337083 usec\nrounds: 1402" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed_decorator[True-True]", + "value": 52.78746788817228, + "unit": "iter/sec", + "range": "stddev: 0.00004744133494559294", + "extra": "mean: 18.943890283171985 msec\nrounds: 53" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed_decorator[True-False]", + "value": 52.624876618364766, + "unit": "iter/sec", + "range": "stddev: 0.00012943246866133624", + "extra": "mean: 19.00241984892417 msec\nrounds: 53" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed_decorator[False-True]", + "value": 53.11644924512497, + "unit": "iter/sec", + "range": "stddev: 0.00025675570309813516", + "extra": "mean: 18.82655964793769 msec\nrounds: 54" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_vmap_transformer_speed_decorator[False-False]", + "value": 53.20071066055675, + "unit": "iter/sec", + "range": "stddev: 0.0000572322826183248", + "extra": "mean: 18.796741389046982 msec\nrounds: 54" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_to_module_speed[True]", + "value": 1071.949533173018, + "unit": "iter/sec", + "range": "stddev: 0.000013261224343263914", + "extra": "mean: 932.8797383212211 usec\nrounds: 982" + }, + { + "name": "benchmarks/nn/functional_benchmarks_test.py::test_to_module_speed[False]", + "value": 1074.1865479675032, + "unit": "iter/sec", + "range": "stddev: 0.000019071991778275747", + "extra": "mean: 930.9369977608885 usec\nrounds: 868" + }, + { + "name": "benchmarks/tensorclass/test_tensorclass_speed.py::test_tc_init", + "value": 27563.676958528024, + "unit": "iter/sec", + "range": "stddev: 0.000001519778861390857", + "extra": "mean: 36.279629945764775 usec\nrounds: 5383" + }, + { + "name": "benchmarks/tensorclass/test_tensorclass_speed.py::test_tc_init_nested", + "value": 13985.089646590755, + "unit": "iter/sec", + "range": "stddev: 0.0000026395525300280788", + "extra": "mean: 71.5047257665436 usec\nrounds: 8584" + }, + { + "name": "benchmarks/tensorclass/test_tensorclass_speed.py::test_tc_first_layer_tensor", + "value": 1444893.9624697994, + "unit": "iter/sec", + "range": "stddev: 5.2959798358308225e-8", + "extra": "mean: 692.0923098679648 nsec\nrounds: 195313" + }, + { + "name": "benchmarks/tensorclass/test_tensorclass_speed.py::test_tc_first_layer_nontensor", + "value": 445729.2780610773, + "unit": "iter/sec", + "range": "stddev: 2.4531871001996166e-7", + "extra": "mean: 2.2435142792279676 usec\nrounds: 111235" + }, + { + "name": "benchmarks/tensorclass/test_tensorclass_speed.py::test_tc_second_layer_tensor", + "value": 721792.6405074416, + "unit": "iter/sec", + "range": "stddev: 1.26569588609402e-7", + "extra": "mean: 1.3854394515535242 usec\nrounds: 173011" + }, + { + "name": "benchmarks/tensorclass/test_tensorclass_speed.py::test_tc_second_layer_nontensor", + "value": 335913.7846151051, + "unit": "iter/sec", + "range": "stddev: 2.9758628282170906e-7", + "extra": "mean: 2.9769543430491083 usec\nrounds: 139665" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_unbind", + "value": 149.57893420220165, + "unit": "iter/sec", + "range": "stddev: 0.0001543738306845643", + "extra": "mean: 6.685433382271559 msec\nrounds: 68" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_full_like", + "value": 109.98050151633848, + "unit": "iter/sec", + "range": "stddev: 0.00014158986069908854", + "extra": "mean: 9.09252082153346 msec\nrounds: 56" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_zeros_like", + "value": 138.6554468370998, + "unit": "iter/sec", + "range": "stddev: 0.0018331115236168679", + "extra": "mean: 7.2121220104310515 msec\nrounds: 196" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_ones_like", + "value": 231.19795518573002, + "unit": "iter/sec", + "range": "stddev: 0.00011102717666244442", + "extra": "mean: 4.3252977700285555 msec\nrounds: 200" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_clone", + "value": 158.49153664357624, + "unit": "iter/sec", + "range": "stddev: 0.00004479255106595677", + "extra": "mean: 6.309485169853898 msec\nrounds: 159" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_squeeze", + "value": 109461.2300306185, + "unit": "iter/sec", + "range": "stddev: 7.680621479565565e-7", + "extra": "mean: 9.135654694546004 usec\nrounds: 14961" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_unsqueeze", + "value": 14668.925482684685, + "unit": "iter/sec", + "range": "stddev: 0.000002831985838224211", + "extra": "mean: 68.17131910448437 usec\nrounds: 5634" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_split", + "value": 6454.518863757201, + "unit": "iter/sec", + "range": "stddev: 0.000018226573110725443", + "extra": "mean: 154.93021573073474 usec\nrounds: 3662" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_permute", + "value": 5870.425900714052, + "unit": "iter/sec", + "range": "stddev: 0.000005286774319803518", + "extra": "mean: 170.3453917846684 usec\nrounds: 2075" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_stack", + "value": 19.8853670035324, + "unit": "iter/sec", + "range": "stddev: 0.00017503299634836496", + "extra": "mean: 50.2882345506805 msec\nrounds: 20" + }, + { + "name": "benchmarks/tensorclass/test_torch_functions.py::test_cat", + "value": 19.944083486860016, + "unit": "iter/sec", + "range": "stddev: 0.0001350529128640932", + "extra": "mean: 50.140183210667026 msec\nrounds: 19" + } + ] } ] }