-
Notifications
You must be signed in to change notification settings - Fork 109
[BugFix] inline TDParams kwargs in prob modules #1093
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Merged
Merged
Conversation
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| Name | Max | Mean | Ops | Ops on Repo HEAD | Change |
|---|---|---|---|---|---|
| test_plain_set_nested | 44.7940μs | 17.0209μs | 58.7513 KOps/s | 60.5200 KOps/s | |
| test_plain_set_stack_nested | 71.0930μs | 17.1299μs | 58.3774 KOps/s | 61.8157 KOps/s | |
| test_plain_set_nested_inplace | 52.4490μs | 18.7441μs | 53.3500 KOps/s | 55.2109 KOps/s | |
| test_plain_set_stack_nested_inplace | 59.7720μs | 18.8086μs | 53.1673 KOps/s | 54.7533 KOps/s | |
| test_items | 35.4260μs | 4.1581μs | 240.4957 KOps/s | 240.7330 KOps/s | |
| test_items_nested | 0.4285ms | 0.3419ms | 2.9248 KOps/s | 2.9419 KOps/s | |
| test_items_nested_locked | 0.5077ms | 0.3383ms | 2.9561 KOps/s | 2.9344 KOps/s | |
| test_items_nested_leaf | 0.1274ms | 72.0472μs | 13.8798 KOps/s | 14.0527 KOps/s | |
| test_items_stack_nested | 0.4682ms | 0.3436ms | 2.9104 KOps/s | 2.9013 KOps/s | |
| test_items_stack_nested_leaf | 0.1555ms | 73.0559μs | 13.6882 KOps/s | 13.4319 KOps/s | |
| test_items_stack_nested_locked | 0.5857ms | 0.3422ms | 2.9224 KOps/s | 2.8897 KOps/s | |
| test_keys | 41.8590μs | 3.5204μs | 284.0599 KOps/s | 283.1702 KOps/s | |
| test_keys_nested | 0.2757ms | 0.1350ms | 7.4056 KOps/s | 7.2372 KOps/s | |
| test_keys_nested_locked | 1.9478ms | 0.1424ms | 7.0236 KOps/s | 7.1179 KOps/s | |
| test_keys_nested_leaf | 0.2002ms | 0.1153ms | 8.6716 KOps/s | 8.6217 KOps/s | |
| test_keys_stack_nested | 0.2306ms | 0.1337ms | 7.4774 KOps/s | 7.5433 KOps/s | |
| test_keys_stack_nested_leaf | 0.2331ms | 0.1144ms | 8.7449 KOps/s | 8.8414 KOps/s | |
| test_keys_stack_nested_locked | 0.2276ms | 0.1390ms | 7.1930 KOps/s | 7.2478 KOps/s | |
| test_values | 9.6522μs | 1.0362μs | 965.1011 KOps/s | 960.7422 KOps/s | |
| test_values_nested | 0.1071ms | 55.3132μs | 18.0789 KOps/s | 18.1809 KOps/s | |
| test_values_nested_locked | 0.1174ms | 55.3683μs | 18.0609 KOps/s | 18.1817 KOps/s | |
| test_values_nested_leaf | 0.1221ms | 60.4286μs | 16.5485 KOps/s | 16.8596 KOps/s | |
| test_values_stack_nested | 0.1258ms | 56.6646μs | 17.6477 KOps/s | 17.5970 KOps/s | |
| test_values_stack_nested_leaf | 0.1309ms | 59.3007μs | 16.8632 KOps/s | 16.8192 KOps/s | |
| test_values_stack_nested_locked | 0.1114ms | 56.7257μs | 17.6287 KOps/s | 17.7248 KOps/s | |
| test_membership | 23.4640μs | 0.8683μs | 1.1516 MOps/s | 1.1771 MOps/s | |
| test_membership_nested | 46.7180μs | 2.7363μs | 365.4634 KOps/s | 364.6063 KOps/s | |
| test_membership_nested_leaf | 53.7310μs | 2.7463μs | 364.1278 KOps/s | 363.5840 KOps/s | |
| test_membership_stacked_nested | 48.7110μs | 2.7044μs | 369.7622 KOps/s | 363.6582 KOps/s | |
| test_membership_stacked_nested_leaf | 46.6370μs | 2.7274μs | 366.6466 KOps/s | 366.4372 KOps/s | |
| test_membership_nested_last | 24.3860μs | 4.0598μs | 246.3206 KOps/s | 249.0799 KOps/s | |
| test_membership_nested_leaf_last | 37.5310μs | 4.1087μs | 243.3838 KOps/s | 248.0511 KOps/s | |
| test_membership_stacked_nested_last | 38.4920μs | 12.9677μs | 77.1149 KOps/s | 77.2761 KOps/s | |
| test_membership_stacked_nested_leaf_last | 69.7200μs | 13.0114μs | 76.8555 KOps/s | 76.0553 KOps/s | |
| test_nested_getleaf | 52.4980μs | 10.5881μs | 94.4452 KOps/s | 92.6528 KOps/s | |
| test_nested_get | 63.0180μs | 10.5168μs | 95.0856 KOps/s | 97.7929 KOps/s | |
| test_stacked_getleaf | 43.5610μs | 10.4894μs | 95.3347 KOps/s | 94.6307 KOps/s | |
| test_stacked_get | 59.7220μs | 10.0712μs | 99.2934 KOps/s | 98.0338 KOps/s | |
| test_nested_getitemleaf | 37.9710μs | 11.1526μs | 89.6654 KOps/s | 88.5519 KOps/s | |
| test_nested_getitem | 60.2230μs | 10.8482μs | 92.1812 KOps/s | 93.4111 KOps/s | |
| test_stacked_getitemleaf | 54.2110μs | 11.0342μs | 90.6269 KOps/s | 90.6276 KOps/s | |
| test_stacked_getitem | 64.3310μs | 10.1847μs | 98.1867 KOps/s | 96.5116 KOps/s | |
| test_lock_nested | 2.9475ms | 0.4483ms | 2.2307 KOps/s | 1.7784 KOps/s | |
| test_lock_stack_nested | 0.5154ms | 0.3990ms | 2.5061 KOps/s | 2.4544 KOps/s | |
| test_unlock_nested | 0.8431ms | 0.3595ms | 2.7818 KOps/s | 2.6662 KOps/s | |
| test_unlock_stack_nested | 0.4383ms | 0.3174ms | 3.1505 KOps/s | 3.0795 KOps/s | |
| test_flatten_speed | 0.1688ms | 91.6184μs | 10.9148 KOps/s | 10.9922 KOps/s | |
| test_unflatten_speed | 0.7963ms | 0.4838ms | 2.0671 KOps/s | 2.1107 KOps/s | |
| test_common_ops | 3.6062ms | 0.7600ms | 1.3158 KOps/s | 1.3733 KOps/s | |
| test_creation | 27.0100μs | 2.1180μs | 472.1448 KOps/s | 482.2876 KOps/s | |
| test_creation_empty | 27.4410μs | 9.3863μs | 106.5379 KOps/s | 116.0004 KOps/s | |
| test_creation_nested_1 | 34.7250μs | 12.1103μs | 82.5743 KOps/s | 88.4671 KOps/s | |
| test_creation_nested_2 | 41.0570μs | 16.4954μs | 60.6231 KOps/s | 64.8241 KOps/s | |
| test_clone | 0.1238ms | 13.2521μs | 75.4595 KOps/s | 72.2513 KOps/s | |
| test_getitem[int] | 0.9457ms | 12.4357μs | 80.4137 KOps/s | 74.9434 KOps/s | |
| test_getitem[slice_int] | 0.1525ms | 24.1306μs | 41.4411 KOps/s | 39.7559 KOps/s | |
| test_getitem[range] | 0.3157ms | 49.4177μs | 20.2357 KOps/s | 20.1457 KOps/s | |
| test_getitem[tuple] | 0.1420ms | 20.0879μs | 49.7812 KOps/s | 48.5710 KOps/s | |
| test_getitem[list] | 0.3194ms | 45.2357μs | 22.1064 KOps/s | 22.1140 KOps/s | |
| test_setitem_dim[int] | 66.7650μs | 26.0614μs | 38.3710 KOps/s | 37.9177 KOps/s | |
| test_setitem_dim[slice_int] | 93.6250μs | 52.2643μs | 19.1335 KOps/s | 19.4676 KOps/s | |
| test_setitem_dim[range] | 0.1184ms | 74.0979μs | 13.4957 KOps/s | 13.4941 KOps/s | |
| test_setitem_dim[tuple] | 89.3270μs | 41.5289μs | 24.0796 KOps/s | 24.3007 KOps/s | |
| test_setitem | 0.1674ms | 19.1600μs | 52.1920 KOps/s | 51.1411 KOps/s | |
| test_set | 0.1285ms | 18.7424μs | 53.3550 KOps/s | 53.2564 KOps/s | |
| test_set_shared | 1.2160ms | 0.1709ms | 5.8526 KOps/s | 5.8707 KOps/s | |
| test_update | 0.2136ms | 20.7687μs | 48.1493 KOps/s | 50.9693 KOps/s | |
| test_update_nested | 0.1892ms | 29.9053μs | 33.4389 KOps/s | 33.3891 KOps/s | |
| test_update__nested | 0.7782ms | 33.8487μs | 29.5433 KOps/s | 29.7803 KOps/s | |
| test_set_nested | 0.1741ms | 20.6007μs | 48.5421 KOps/s | 48.2040 KOps/s | |
| test_set_nested_new | 0.1273ms | 25.2715μs | 39.5702 KOps/s | 39.0155 KOps/s | |
| test_select | 0.2005ms | 41.4676μs | 24.1152 KOps/s | 24.1475 KOps/s | |
| test_select_nested | 0.1175ms | 59.9852μs | 16.6708 KOps/s | 16.0373 KOps/s | |
| test_exclude_nested | 0.1468ms | 75.5860μs | 13.2300 KOps/s | 12.9989 KOps/s | |
| test_empty[True] | 0.6549ms | 0.3591ms | 2.7845 KOps/s | 2.8366 KOps/s | |
| test_empty[False] | 7.4540μs | 1.2399μs | 806.5276 KOps/s | 792.1848 KOps/s | |
| test_unbind_speed | 0.5223ms | 0.2588ms | 3.8637 KOps/s | 3.7954 KOps/s | |
| test_unbind_speed_stack0 | 0.3978ms | 0.2505ms | 3.9926 KOps/s | 3.9852 KOps/s | |
| test_unbind_speed_stack1 | 0.1093s | 0.7557ms | 1.3232 KOps/s | 1.4519 KOps/s | |
| test_split | 0.1087s | 1.7606ms | 567.9792 Ops/s | 560.6796 Ops/s | |
| test_chunk | 2.6454ms | 1.5888ms | 629.4093 Ops/s | 565.3622 Ops/s | |
| test_consolidate_njt[False-None] | 0.1183s | 9.1491ms | 109.3005 Ops/s | 121.3871 Ops/s | |
| test_creation[device0] | 0.4108ms | 91.5754μs | 10.9200 KOps/s | 10.6667 KOps/s | |
| test_creation_from_tensor | 3.3167ms | 95.5803μs | 10.4624 KOps/s | 10.5477 KOps/s | |
| test_add_one[memmap_tensor0] | 0.1705ms | 4.6912μs | 213.1659 KOps/s | 206.3273 KOps/s | |
| test_contiguous[memmap_tensor0] | 11.7120μs | 0.5120μs | 1.9531 MOps/s | 1.9626 MOps/s | |
| test_stack[memmap_tensor0] | 40.2150μs | 3.3769μs | 296.1253 KOps/s | 288.7429 KOps/s | |
| test_memmaptd_index | 1.2822ms | 0.2339ms | 4.2758 KOps/s | 4.0987 KOps/s | |
| test_memmaptd_index_astensor | 0.5480ms | 0.3106ms | 3.2193 KOps/s | 3.1455 KOps/s | |
| test_memmaptd_index_op | 0.9886ms | 0.5576ms | 1.7935 KOps/s | 1.8155 KOps/s | |
| test_serialize_model | 0.1262s | 0.1180s | 8.4718 Ops/s | 7.4164 Ops/s | |
| test_serialize_model_pickle | 0.4591s | 0.3967s | 2.5206 Ops/s | 2.5755 Ops/s | |
| test_serialize_weights | 0.1196s | 0.1144s | 8.7418 Ops/s | 8.6292 Ops/s | |
| test_serialize_weights_returnearly | 0.1684s | 0.1565s | 6.3893 Ops/s | 6.3133 Ops/s | |
| test_serialize_weights_pickle | 1.0905s | 0.8130s | 1.2299 Ops/s | 2.4430 Ops/s | |
| test_serialize_weights_filesystem | 0.1446s | 0.1410s | 7.0897 Ops/s | 6.4137 Ops/s | |
| test_serialize_model_filesystem | 0.1492s | 0.1428s | 7.0019 Ops/s | 6.6085 Ops/s | |
| test_reshape_pytree | 58.8100μs | 26.7371μs | 37.4013 KOps/s | 37.4251 KOps/s | |
| test_reshape_td | 68.9490μs | 33.5094μs | 29.8424 KOps/s | 30.2195 KOps/s | |
| test_view_pytree | 58.1090μs | 27.1004μs | 36.8999 KOps/s | 37.2752 KOps/s | |
| test_view_td | 91.5010μs | 38.2716μs | 26.1290 KOps/s | 25.9519 KOps/s | |
| test_unbind_pytree | 74.8700μs | 30.3288μs | 32.9720 KOps/s | 33.9869 KOps/s | |
| test_unbind_td | 0.3376ms | 38.8607μs | 25.7330 KOps/s | 25.7647 KOps/s | |
| test_split_pytree | 74.3790μs | 29.9882μs | 33.3465 KOps/s | 34.1750 KOps/s | |
| test_split_td | 0.2101ms | 44.0038μs | 22.7253 KOps/s | 22.0370 KOps/s | |
| test_add_pytree | 80.6510μs | 36.5606μs | 27.3518 KOps/s | 27.7915 KOps/s | |
| test_add_td | 0.1545ms | 55.0238μs | 18.1740 KOps/s | 19.2800 KOps/s | |
| test_compile_add_one_nested[tensordict-compile] | 0.1350ms | 62.1085μs | 16.1008 KOps/s | 16.2859 KOps/s | |
| test_compile_add_one_nested[tensordict-eager] | 0.3935ms | 0.1607ms | 6.2234 KOps/s | 6.2297 KOps/s | |
| test_compile_add_one_nested[pytree-compile] | 97.4920μs | 45.7638μs | 21.8513 KOps/s | 22.1748 KOps/s | |
| test_compile_add_one_nested[pytree-eager] | 0.2308ms | 0.1177ms | 8.4942 KOps/s | 8.4900 KOps/s | |
| test_compile_copy_nested[tensordict-compile] | 58.3600μs | 25.7647μs | 38.8128 KOps/s | 38.2003 KOps/s | |
| test_compile_copy_nested[tensordict-eager] | 0.1217ms | 52.9632μs | 18.8810 KOps/s | 18.1821 KOps/s | |
| test_compile_copy_nested[pytree-compile] | 0.1677ms | 78.6416μs | 12.7159 KOps/s | 12.4020 KOps/s | |
| test_compile_copy_nested[pytree-eager] | 0.1227ms | 67.9156μs | 14.7241 KOps/s | 14.5449 KOps/s | |
| test_compile_add_one_flat[tensordict-compile] | 0.1868ms | 0.1041ms | 9.6076 KOps/s | 9.5758 KOps/s | |
| test_compile_add_one_flat[tensordict-eager] | 0.3504ms | 0.1982ms | 5.0443 KOps/s | 5.0752 KOps/s | |
| test_compile_add_one_flat[tensorclass-compile] | 0.1262ms | 45.1706μs | 22.1383 KOps/s | 22.4985 KOps/s | |
| test_compile_add_one_flat[tensorclass-eager] | 0.4774ms | 61.7711μs | 16.1888 KOps/s | 16.5313 KOps/s | |
| test_compile_add_one_flat[pytree-compile] | 0.2215ms | 0.1046ms | 9.5618 KOps/s | 9.9128 KOps/s | |
| test_compile_add_one_flat[pytree-eager] | 0.3707ms | 0.1981ms | 5.0471 KOps/s | 4.9779 KOps/s | |
| test_compile_add_self_flat[tensordict-eager] | 0.4253ms | 0.2115ms | 4.7292 KOps/s | 4.8095 KOps/s | |
| test_compile_add_self_flat[tensordict-compile] | 0.2077ms | 0.1058ms | 9.4500 KOps/s | 9.5557 KOps/s | |
| test_compile_add_self_flat[tensorclass-eager] | 0.1908ms | 56.5995μs | 17.6680 KOps/s | 18.2498 KOps/s | |
| test_compile_add_self_flat[tensorclass-compile] | 0.1011ms | 46.3239μs | 21.5871 KOps/s | 22.0298 KOps/s | |
| test_compile_add_self_flat[pytree-eager] | 0.6108ms | 0.1584ms | 6.3141 KOps/s | 6.3581 KOps/s | |
| test_compile_add_self_flat[pytree-compile] | 0.1874ms | 0.1022ms | 9.7872 KOps/s | 9.5481 KOps/s | |
| test_compile_copy_flat[tensordict-compile] | 70.6630μs | 21.2933μs | 46.9631 KOps/s | 48.1566 KOps/s | |
| test_compile_copy_flat[tensordict-eager] | 0.1696ms | 58.7231μs | 17.0291 KOps/s | 17.0861 KOps/s | |
| test_compile_copy_flat[pytree-compile] | 0.1716ms | 80.2664μs | 12.4585 KOps/s | 12.3154 KOps/s | |
| test_compile_copy_flat[pytree-eager] | 0.1267ms | 68.5524μs | 14.5874 KOps/s | 14.4880 KOps/s | |
| test_compile_assign_and_add[tensordict-compile] | 0.3061ms | 0.2057ms | 4.8615 KOps/s | 4.8072 KOps/s | |
| test_compile_assign_and_add[tensordict-eager] | 2.2709ms | 1.3067ms | 765.3133 Ops/s | 788.0408 Ops/s | |
| test_compile_assign_and_add[pytree-compile] | 0.4324ms | 0.2055ms | 4.8653 KOps/s | 5.0326 KOps/s | |
| test_compile_assign_and_add[pytree-eager] | 1.0275ms | 0.7699ms | 1.2989 KOps/s | 1.3055 KOps/s | |
| test_compile_assign_and_add_stack[compile] | 0.8030ms | 0.4539ms | 2.2031 KOps/s | 2.1929 KOps/s | |
| test_compile_assign_and_add_stack[eager] | 2.7934ms | 2.5638ms | 390.0510 Ops/s | 407.1632 Ops/s | |
| test_compile_indexing[tensor-tensordict-compile] | 0.1103ms | 36.2405μs | 27.5935 KOps/s | 28.8401 KOps/s | |
| test_compile_indexing[tensor-tensordict-eager] | 0.6580ms | 35.1869μs | 28.4196 KOps/s | 29.0805 KOps/s | |
| test_compile_indexing[tensor-tensorclass-compile] | 0.1151ms | 29.7647μs | 33.5969 KOps/s | 34.6921 KOps/s | |
| test_compile_indexing[tensor-tensorclass-eager] | 70.2810μs | 24.0189μs | 41.6338 KOps/s | 41.6456 KOps/s | |
| test_compile_indexing[tensor-pytree-compile] | 71.6740μs | 30.5517μs | 32.7314 KOps/s | 34.0039 KOps/s | |
| test_compile_indexing[tensor-pytree-eager] | 0.2593ms | 23.6957μs | 42.2018 KOps/s | 42.6552 KOps/s | |
| test_compile_indexing[slice-tensordict-compile] | 0.1479ms | 50.7442μs | 19.7067 KOps/s | 20.1227 KOps/s | |
| test_compile_indexing[slice-tensordict-eager] | 0.6633ms | 20.2603μs | 49.3577 KOps/s | 47.7310 KOps/s | |
| test_compile_indexing[slice-tensorclass-compile] | 0.1039ms | 43.3627μs | 23.0613 KOps/s | 23.7706 KOps/s | |
| test_compile_indexing[slice-tensorclass-eager] | 64.4810μs | 19.2862μs | 51.8506 KOps/s | 53.1526 KOps/s | |
| test_compile_indexing[slice-pytree-compile] | 0.1023ms | 44.7522μs | 22.3453 KOps/s | 23.1653 KOps/s | |
| test_compile_indexing[slice-pytree-eager] | 61.4550μs | 19.0425μs | 52.5142 KOps/s | 51.3691 KOps/s | |
| test_compile_indexing[int-tensordict-compile] | 0.1332ms | 51.4017μs | 19.4546 KOps/s | 19.7853 KOps/s | |
| test_compile_indexing[int-tensordict-eager] | 0.8666ms | 20.1314μs | 49.6736 KOps/s | 47.6339 KOps/s | |
| test_compile_indexing[int-tensorclass-compile] | 0.1383ms | 43.9527μs | 22.7517 KOps/s | 23.0675 KOps/s | |
| test_compile_indexing[int-tensorclass-eager] | 65.9630μs | 19.0040μs | 52.6206 KOps/s | 53.0393 KOps/s | |
| test_compile_indexing[int-pytree-compile] | 0.1055ms | 44.0668μs | 22.6928 KOps/s | 22.7502 KOps/s | |
| test_compile_indexing[int-pytree-eager] | 1.3169ms | 19.0316μs | 52.5442 KOps/s | 53.1920 KOps/s | |
| test_mod_add[eager] | 73.9380μs | 26.4010μs | 37.8774 KOps/s | 40.3640 KOps/s | |
| test_mod_add[compile] | 99.4560μs | 44.2393μs | 22.6043 KOps/s | 23.0797 KOps/s | |
| test_mod_add[compile-overhead] | 0.1263ms | 44.1857μs | 22.6317 KOps/s | 23.0329 KOps/s | |
| test_mod_wrap[eager] | 0.3397ms | 0.2170ms | 4.6087 KOps/s | 4.6905 KOps/s | |
| test_mod_wrap[compile] | 1.7772ms | 0.2050ms | 4.8778 KOps/s | 4.8844 KOps/s | |
| test_mod_wrap[compile-overhead] | 1.7139ms | 0.2016ms | 4.9604 KOps/s | 4.9094 KOps/s | |
| test_mod_wrap_and_backward[eager] | 14.5358ms | 11.7352ms | 85.2136 Ops/s | 85.9812 Ops/s | |
| test_mod_wrap_and_backward[compile] | 18.4488ms | 12.7650ms | 78.3391 Ops/s | 76.0079 Ops/s | |
| test_mod_wrap_and_backward[compile-overhead] | 16.9986ms | 12.4774ms | 80.1447 Ops/s | 78.2818 Ops/s | |
| test_seq_add[eager] | 0.2113ms | 89.5674μs | 11.1648 KOps/s | 11.4799 KOps/s | |
| test_seq_add[compile] | 0.1453ms | 59.0855μs | 16.9246 KOps/s | 16.5791 KOps/s | |
| test_seq_add[compile-overhead] | 0.1142ms | 56.6413μs | 17.6550 KOps/s | 17.1696 KOps/s | |
| test_seq_wrap[eager] | 0.6852ms | 0.3930ms | 2.5444 KOps/s | 2.5827 KOps/s | |
| test_seq_wrap[compile] | 0.4369ms | 0.2251ms | 4.4416 KOps/s | 4.3899 KOps/s | |
| test_seq_wrap[compile-overhead] | 0.4535ms | 0.2250ms | 4.4449 KOps/s | 4.4081 KOps/s | |
| test_func_call_runtime[False-eager] | 0.9912ms | 0.5664ms | 1.7656 KOps/s | 1.7896 KOps/s | |
| test_func_call_runtime[False-compile] | 0.7753ms | 0.4299ms | 2.3260 KOps/s | 2.3450 KOps/s | |
| test_func_call_runtime[False-compile-overhead] | 0.6029ms | 0.4270ms | 2.3418 KOps/s | 2.3272 KOps/s | |
| test_func_call_runtime[True-eager] | 1.3349ms | 0.7738ms | 1.2923 KOps/s | 1.3134 KOps/s | |
| test_func_call_runtime[True-compile] | 0.8213ms | 0.4727ms | 2.1153 KOps/s | 2.1390 KOps/s | |
| test_func_call_runtime[True-compile-overhead] | 0.7399ms | 0.4684ms | 2.1349 KOps/s | 2.1259 KOps/s | |
| test_func_call_cm_runtime[False-eager] | 0.9964ms | 0.5582ms | 1.7914 KOps/s | 1.8424 KOps/s | |
| test_func_call_cm_runtime[False-compile] | 0.7918ms | 0.4275ms | 2.3394 KOps/s | 2.3343 KOps/s | |
| test_func_call_cm_runtime[False-compile-overhead] | 0.5437ms | 0.4251ms | 2.3527 KOps/s | 2.3598 KOps/s | |
| test_func_call_cm_runtime[True-eager] | 1.4222ms | 0.9081ms | 1.1012 KOps/s | 1.1181 KOps/s | |
| test_func_call_cm_runtime[True-compile] | 0.6200ms | 0.4883ms | 2.0478 KOps/s | 1.9980 KOps/s | |
| test_func_call_cm_runtime[True-compile-overhead] | 0.7939ms | 0.4917ms | 2.0338 KOps/s | 2.0185 KOps/s | |
| test_vmap_func_call_cm_runtime[eager] | 2.8016ms | 1.9080ms | 524.1126 Ops/s | 513.9155 Ops/s | |
| test_vmap_func_call_cm_runtime[compile] | 0.8123ms | 0.5201ms | 1.9228 KOps/s | 1.9232 KOps/s | |
| test_vmap_func_call_cm_runtime[compile-overhead] | 0.7031ms | 0.5251ms | 1.9044 KOps/s | 1.9458 KOps/s | |
| test_distributed | 0.4379ms | 0.1289ms | 7.7599 KOps/s | 7.6300 KOps/s | |
| test_tdmodule | 31.8200μs | 17.5512μs | 56.9763 KOps/s | 58.4691 KOps/s | |
| test_tdmodule_dispatch | 58.0490μs | 34.8918μs | 28.6600 KOps/s | 29.8555 KOps/s | |
| test_tdseq | 47.6190μs | 20.7676μs | 48.1520 KOps/s | 51.2708 KOps/s | |
| test_tdseq_dispatch | 71.4240μs | 40.8161μs | 24.5002 KOps/s | 25.4599 KOps/s | |
| test_instantiation_functorch | 2.0274ms | 1.5604ms | 640.8768 Ops/s | 652.3588 Ops/s | |
| test_exec_functorch | 0.3735ms | 0.1836ms | 5.4456 KOps/s | 5.6138 KOps/s | |
| test_exec_functional_call | 0.3418ms | 0.1751ms | 5.7111 KOps/s | 5.8838 KOps/s | |
| test_exec_td_decorator | 0.5827ms | 0.2351ms | 4.2534 KOps/s | 4.4211 KOps/s | |
| test_vmap_mlp_speed_decorator[True-True] | 1.0428ms | 0.6344ms | 1.5762 KOps/s | 1.5505 KOps/s | |
| test_vmap_mlp_speed_decorator[True-False] | 0.8559ms | 0.6335ms | 1.5786 KOps/s | 1.5803 KOps/s | |
| test_vmap_mlp_speed_decorator[False-True] | 0.9974ms | 0.5444ms | 1.8368 KOps/s | 1.9283 KOps/s | |
| test_vmap_mlp_speed_decorator[False-False] | 0.9010ms | 0.5316ms | 1.8813 KOps/s | 1.9312 KOps/s | |
| test_to_module_speed[True] | 1.9509ms | 1.3080ms | 764.5547 Ops/s | 774.4690 Ops/s | |
| test_to_module_speed[False] | 1.4068ms | 1.2742ms | 784.8285 Ops/s | 806.2115 Ops/s | |
| test_tc_init | 91.8220μs | 43.9892μs | 22.7329 KOps/s | 23.1141 KOps/s | |
| test_tc_init_nested | 0.2335ms | 87.4054μs | 11.4409 KOps/s | 11.6947 KOps/s | |
| test_tc_first_layer_tensor | 22.8330μs | 1.5231μs | 656.5735 KOps/s | 645.2428 KOps/s | |
| test_tc_first_layer_nontensor | 30.7170μs | 4.7015μs | 212.6989 KOps/s | 206.9444 KOps/s | |
| test_tc_second_layer_tensor | 26.4290μs | 2.8001μs | 357.1332 KOps/s | 345.8553 KOps/s | |
| test_tc_second_layer_nontensor | 37.6210μs | 6.1633μs | 162.2503 KOps/s | 166.3035 KOps/s | |
| test_unbind | 0.2335s | 15.2111ms | 65.7416 Ops/s | 78.6649 Ops/s | |
| test_full_like | 9.0690ms | 7.6584ms | 130.5756 Ops/s | 129.7557 Ops/s | |
| test_zeros_like | 3.8308ms | 2.9296ms | 341.3482 Ops/s | 320.8785 Ops/s | |
| test_ones_like | 4.1946ms | 3.5890ms | 278.6262 Ops/s | 292.0185 Ops/s | |
| test_clone | 6.1695ms | 5.3163ms | 188.1019 Ops/s | 189.0224 Ops/s | |
| test_squeeze | 79.8190μs | 11.6339μs | 85.9559 KOps/s | 84.6659 KOps/s | |
| test_unsqueeze | 0.2102ms | 86.1922μs | 11.6020 KOps/s | 11.2416 KOps/s | |
| test_split | 0.3436ms | 0.1821ms | 5.4916 KOps/s | 5.2006 KOps/s | |
| test_permute | 0.4385ms | 0.2192ms | 4.5613 KOps/s | 4.5185 KOps/s | |
| test_stack | 31.5820ms | 25.5589ms | 39.1253 Ops/s | 39.2093 Ops/s | |
| test_cat | 30.9127ms | 25.0971ms | 39.8452 Ops/s | 39.1180 Ops/s |

| Name | Max | Mean | Ops | Ops on Repo HEAD | Change |
|---|---|---|---|---|---|
| test_plain_set_nested | 52.0910μs | 10.4844μs | 95.3794 KOps/s | 92.9681 KOps/s | |
| test_plain_set_stack_nested | 33.4910μs | 10.6012μs | 94.3293 KOps/s | 91.5611 KOps/s | |
| test_plain_set_nested_inplace | 35.5610μs | 11.5000μs | 86.9569 KOps/s | 83.2251 KOps/s | |
| test_plain_set_stack_nested_inplace | 38.6910μs | 11.5317μs | 86.7178 KOps/s | 83.8048 KOps/s | |
| test_items | 26.6610μs | 2.8876μs | 346.3064 KOps/s | 340.2368 KOps/s | |
| test_items_nested | 0.3747ms | 0.3221ms | 3.1042 KOps/s | 3.1099 KOps/s | |
| test_items_nested_locked | 0.3845ms | 0.3247ms | 3.0802 KOps/s | 3.0927 KOps/s | |
| test_items_nested_leaf | 87.2020μs | 58.5880μs | 17.0683 KOps/s | 17.1567 KOps/s | |
| test_items_stack_nested | 0.4427ms | 0.3239ms | 3.0872 KOps/s | 3.1038 KOps/s | |
| test_items_stack_nested_leaf | 86.7020μs | 59.0473μs | 16.9356 KOps/s | 16.8297 KOps/s | |
| test_items_stack_nested_locked | 0.3739ms | 0.3247ms | 3.0793 KOps/s | 3.1234 KOps/s | |
| test_keys | 26.9510μs | 3.5555μs | 281.2573 KOps/s | 282.6549 KOps/s | |
| test_keys_nested | 0.1008ms | 70.9216μs | 14.1001 KOps/s | 14.1320 KOps/s | |
| test_keys_nested_locked | 3.0031ms | 76.5011μs | 13.0717 KOps/s | 13.1056 KOps/s | |
| test_keys_nested_leaf | 90.8020μs | 62.0860μs | 16.1067 KOps/s | 16.1739 KOps/s | |
| test_keys_stack_nested | 0.1001ms | 71.5000μs | 13.9860 KOps/s | 14.1828 KOps/s | |
| test_keys_stack_nested_leaf | 90.9420μs | 62.6418μs | 15.9638 KOps/s | 16.3240 KOps/s | |
| test_keys_stack_nested_locked | 0.1150ms | 76.1913μs | 13.1249 KOps/s | 13.2626 KOps/s | |
| test_values | 5.9818μs | 0.8437μs | 1.1853 MOps/s | 1.1790 MOps/s | |
| test_values_nested | 65.1220μs | 32.9726μs | 30.3282 KOps/s | 30.6302 KOps/s | |
| test_values_nested_locked | 80.9420μs | 35.0972μs | 28.4923 KOps/s | 28.9055 KOps/s | |
| test_values_nested_leaf | 63.1520μs | 35.3236μs | 28.3097 KOps/s | 28.5778 KOps/s | |
| test_values_stack_nested | 66.0110μs | 33.2298μs | 30.0935 KOps/s | 30.2185 KOps/s | |
| test_values_stack_nested_leaf | 64.7810μs | 35.5095μs | 28.1615 KOps/s | 27.9958 KOps/s | |
| test_values_stack_nested_locked | 62.7420μs | 35.0631μs | 28.5200 KOps/s | 28.8444 KOps/s | |
| test_membership | 2.0171μs | 0.5626μs | 1.7773 MOps/s | 1.7746 MOps/s | |
| test_membership_nested | 18.8005μs | 1.9634μs | 509.3230 KOps/s | 483.5504 KOps/s | |
| test_membership_nested_leaf | 21.4305μs | 1.9939μs | 501.5251 KOps/s | 495.3653 KOps/s | |
| test_membership_stacked_nested | 29.3800μs | 2.0773μs | 481.3910 KOps/s | 476.8038 KOps/s | |
| test_membership_stacked_nested_leaf | 45.1410μs | 2.0924μs | 477.9251 KOps/s | 477.3484 KOps/s | |
| test_membership_nested_last | 38.7600μs | 2.9995μs | 333.3891 KOps/s | 332.8496 KOps/s | |
| test_membership_nested_leaf_last | 33.1510μs | 2.9939μs | 334.0143 KOps/s | 334.5355 KOps/s | |
| test_membership_stacked_nested_last | 49.4120μs | 3.0219μs | 330.9176 KOps/s | 124.6210 KOps/s | |
| test_membership_stacked_nested_leaf_last | 34.0600μs | 2.9915μs | 334.2854 KOps/s | 123.6727 KOps/s | |
| test_nested_getleaf | 47.9810μs | 6.0129μs | 166.3078 KOps/s | 165.1098 KOps/s | |
| test_nested_get | 44.7710μs | 5.7127μs | 175.0496 KOps/s | 174.3934 KOps/s | |
| test_stacked_getleaf | 48.3210μs | 6.0200μs | 166.1118 KOps/s | 166.4425 KOps/s | |
| test_stacked_get | 29.3510μs | 5.6861μs | 175.8665 KOps/s | 176.1958 KOps/s | |
| test_nested_getitemleaf | 34.3810μs | 6.0875μs | 164.2702 KOps/s | 162.2623 KOps/s | |
| test_nested_getitem | 79.9820μs | 5.8047μs | 172.2739 KOps/s | 171.3235 KOps/s | |
| test_stacked_getitemleaf | 35.7310μs | 6.2428μs | 160.1842 KOps/s | 161.9391 KOps/s | |
| test_stacked_getitem | 36.3810μs | 5.7360μs | 174.3384 KOps/s | 171.9820 KOps/s | |
| test_lock_nested | 7.1426ms | 0.3741ms | 2.6729 KOps/s | 2.6004 KOps/s | |
| test_lock_stack_nested | 0.3670ms | 0.3397ms | 2.9434 KOps/s | 2.9318 KOps/s | |
| test_unlock_nested | 0.6639ms | 0.3077ms | 3.2497 KOps/s | 3.1592 KOps/s | |
| test_unlock_stack_nested | 0.3180ms | 0.2756ms | 3.6290 KOps/s | 3.6190 KOps/s | |
| test_flatten_speed | 0.1102ms | 73.3818μs | 13.6274 KOps/s | 13.5164 KOps/s | |
| test_unflatten_speed | 0.4583ms | 0.2985ms | 3.3498 KOps/s | 3.3670 KOps/s | |
| test_common_ops | 1.7531ms | 0.5829ms | 1.7155 KOps/s | 1.6101 KOps/s | |
| test_creation | 0.1095ms | 1.5304μs | 653.4371 KOps/s | 612.8121 KOps/s | |
| test_creation_empty | 30.5410μs | 7.1516μs | 139.8286 KOps/s | 126.1763 KOps/s | |
| test_creation_nested_1 | 38.0010μs | 8.7791μs | 113.9068 KOps/s | 103.8971 KOps/s | |
| test_creation_nested_2 | 52.8910μs | 11.2149μs | 89.1670 KOps/s | 82.6883 KOps/s | |
| test_clone | 55.6320μs | 10.4433μs | 95.7549 KOps/s | 86.2156 KOps/s | |
| test_getitem[int] | 93.2138ms | 15.8266μs | 63.1847 KOps/s | 91.3413 KOps/s | |
| test_getitem[slice_int] | 0.1085ms | 20.7503μs | 48.1922 KOps/s | 46.6031 KOps/s | |
| test_getitem[range] | 0.1281ms | 37.0807μs | 26.9682 KOps/s | 25.8754 KOps/s | |
| test_getitem[tuple] | 0.1125ms | 18.0039μs | 55.5435 KOps/s | 54.5767 KOps/s | |
| test_getitem[list] | 0.1905ms | 32.6393μs | 30.6379 KOps/s | 29.2925 KOps/s | |
| test_setitem_dim[int] | 42.4710μs | 18.4172μs | 54.2972 KOps/s | 50.4451 KOps/s | |
| test_setitem_dim[slice_int] | 60.2110μs | 37.1147μs | 26.9435 KOps/s | 25.5399 KOps/s | |
| test_setitem_dim[range] | 85.6620μs | 52.8885μs | 18.9077 KOps/s | 18.3061 KOps/s | |
| test_setitem_dim[tuple] | 59.9210μs | 31.1280μs | 32.1254 KOps/s | 30.1871 KOps/s | |
| test_setitem | 90.6820μs | 14.2341μs | 70.2539 KOps/s | 60.7878 KOps/s | |
| test_set | 80.9920μs | 13.6938μs | 73.0258 KOps/s | 62.7806 KOps/s | |
| test_set_shared | 1.6364ms | 0.1460ms | 6.8494 KOps/s | 6.6959 KOps/s | |
| test_update | 0.4448ms | 16.2043μs | 61.7120 KOps/s | 53.2092 KOps/s | |
| test_update_nested | 96.7620μs | 20.6063μs | 48.5288 KOps/s | 42.4408 KOps/s | |
| test_update__nested | 0.9249ms | 24.4479μs | 40.9033 KOps/s | 37.1535 KOps/s | |
| test_set_nested | 79.1720μs | 14.9635μs | 66.8294 KOps/s | 59.7182 KOps/s | |
| test_set_nested_new | 91.9420μs | 17.9374μs | 55.7494 KOps/s | 51.8081 KOps/s | |
| test_select | 98.4630μs | 29.8564μs | 33.4937 KOps/s | 31.6128 KOps/s | |
| test_select_nested | 78.2010μs | 43.0496μs | 23.2290 KOps/s | 22.8247 KOps/s | |
| test_exclude_nested | 0.1048ms | 60.4660μs | 16.5382 KOps/s | 16.7000 KOps/s | |
| test_empty[True] | 0.6772ms | 0.2579ms | 3.8780 KOps/s | 3.8610 KOps/s | |
| test_empty[False] | 3.5740μs | 0.7533μs | 1.3275 MOps/s | 1.3392 MOps/s | |
| test_to | 86.4520μs | 55.1413μs | 18.1352 KOps/s | 17.6501 KOps/s | |
| test_to_nonblocking | 96.6620μs | 47.7865μs | 20.9264 KOps/s | 19.7414 KOps/s | |
| test_unbind_speed | 0.8570ms | 0.2308ms | 4.3336 KOps/s | 4.1182 KOps/s | |
| test_unbind_speed_stack0 | 0.2953ms | 0.2310ms | 4.3290 KOps/s | 4.2712 KOps/s | |
| test_unbind_speed_stack1 | 92.6371ms | 0.6515ms | 1.5348 KOps/s | 1.5460 KOps/s | |
| test_split | 93.9772ms | 1.7063ms | 586.0779 Ops/s | 573.0825 Ops/s | |
| test_chunk | 1.6453ms | 1.4380ms | 695.3940 Ops/s | 681.1952 Ops/s | |
| test_consolidate[False-None] | 96.9589ms | 2.8557ms | 350.1729 Ops/s | 351.3443 Ops/s | |
| test_consolidate[default-None] | 1.7267ms | 1.6438ms | 608.3599 Ops/s | 595.6919 Ops/s | |
| test_consolidate[reduce-overhead-None] | 1.7626ms | 1.6776ms | 596.1018 Ops/s | 586.6866 Ops/s | |
| test_consolidate_njt[False-None] | 6.8750ms | 6.5660ms | 152.3008 Ops/s | 148.7848 Ops/s | |
| test_to[False-False-None] | 1.7698ms | 1.6933ms | 590.5573 Ops/s | 567.3522 Ops/s | |
| test_to[True-False-None] | 1.4884ms | 1.2611ms | 792.9763 Ops/s | 754.9994 Ops/s | |
| test_to[within-False-None] | 4.0899ms | 3.9961ms | 250.2452 Ops/s | 246.7359 Ops/s | |
| test_to[True-default-None] | 5.3391ms | 5.1124ms | 195.6021 Ops/s | 186.5155 Ops/s | |
| test_to_njt[False-False-None] | 7.3897ms | 7.0326ms | 142.1954 Ops/s | 135.2293 Ops/s | |
| test_to_njt[True-False-None] | 5.6794ms | 5.5091ms | 181.5182 Ops/s | 174.1128 Ops/s | |
| test_to_njt[within-False-None] | 12.4228ms | 12.1905ms | 82.0312 Ops/s | 80.1927 Ops/s | |
| test_creation[device0] | 0.7438ms | 79.1993μs | 12.6264 KOps/s | 12.4980 KOps/s | |
| test_creation_from_tensor | 0.5490ms | 82.0163μs | 12.1927 KOps/s | 11.4867 KOps/s | |
| test_add_one[memmap_tensor0] | 0.4209ms | 6.6742μs | 149.8296 KOps/s | 138.4105 KOps/s | |
| test_contiguous[memmap_tensor0] | 1.8140μs | 0.4019μs | 2.4883 MOps/s | 1.7634 MOps/s | |
| test_stack[memmap_tensor0] | 35.7610μs | 4.4437μs | 225.0372 KOps/s | 221.8301 KOps/s | |
| test_memmaptd_index | 1.6923ms | 0.2571ms | 3.8894 KOps/s | 4.0000 KOps/s | |
| test_memmaptd_index_astensor | 0.6163ms | 0.3211ms | 3.1144 KOps/s | 3.1687 KOps/s | |
| test_memmaptd_index_op | 0.9994ms | 0.5743ms | 1.7413 KOps/s | 1.6495 KOps/s | |
| test_serialize_model | 0.1312s | 0.1303s | 7.6748 Ops/s | 7.6664 Ops/s | |
| test_serialize_model_pickle | 1.3594s | 1.2148s | 0.8232 Ops/s | 0.8435 Ops/s | |
| test_serialize_weights | 0.1304s | 0.1292s | 7.7390 Ops/s | 5.4775 Ops/s | |
| test_serialize_weights_returnearly | 0.3042s | 54.1150ms | 18.4792 Ops/s | 23.0167 Ops/s | |
| test_serialize_weights_pickle | 1.3778s | 1.1902s | 0.8402 Ops/s | 0.8222 Ops/s | |
| test_reshape_pytree | 0.4019ms | 22.6028μs | 44.2423 KOps/s | 43.4891 KOps/s | |
| test_reshape_td | 58.9020μs | 26.8282μs | 37.2742 KOps/s | 35.7096 KOps/s | |
| test_view_pytree | 58.0520μs | 22.4202μs | 44.6026 KOps/s | 43.2995 KOps/s | |
| test_view_td | 0.4086ms | 29.4448μs | 33.9618 KOps/s | 31.1013 KOps/s | |
| test_unbind_pytree | 49.3510μs | 28.2129μs | 35.4448 KOps/s | 33.3714 KOps/s | |
| test_unbind_td | 0.7498ms | 35.7749μs | 27.9525 KOps/s | 25.5871 KOps/s | |
| test_split_pytree | 59.7020μs | 30.4579μs | 32.8322 KOps/s | 29.9090 KOps/s | |
| test_split_td | 0.7780ms | 38.4742μs | 25.9914 KOps/s | 24.2128 KOps/s | |
| test_add_pytree | 68.9210μs | 34.9156μs | 28.6405 KOps/s | 25.3388 KOps/s | |
| test_add_td | 0.4439ms | 46.0295μs | 21.7252 KOps/s | 18.2770 KOps/s | |
| test_compile_add_one_nested[tensordict-compile] | 0.1723ms | 0.1215ms | 8.2303 KOps/s | 8.0136 KOps/s | |
| test_compile_add_one_nested[tensordict-eager] | 0.2456ms | 0.1302ms | 7.6780 KOps/s | 7.6674 KOps/s | |
| test_compile_add_one_nested[pytree-compile] | 0.4720ms | 97.6817μs | 10.2373 KOps/s | 10.2105 KOps/s | |
| test_compile_add_one_nested[pytree-eager] | 1.4496ms | 0.1518ms | 6.5898 KOps/s | 6.3363 KOps/s | |
| test_compile_copy_nested[tensordict-compile] | 0.4126ms | 23.7841μs | 42.0448 KOps/s | 41.2404 KOps/s | |
| test_compile_copy_nested[tensordict-eager] | 0.4116ms | 27.2279μs | 36.7270 KOps/s | 35.3649 KOps/s | |
| test_compile_copy_nested[pytree-compile] | 0.4466ms | 66.9424μs | 14.9382 KOps/s | 14.9450 KOps/s | |
| test_compile_copy_nested[pytree-eager] | 0.4273ms | 51.2039μs | 19.5298 KOps/s | 19.3040 KOps/s | |
| test_compile_add_one_flat[tensordict-compile] | 0.1823ms | 0.1428ms | 7.0040 KOps/s | 6.8175 KOps/s | |
| test_compile_add_one_flat[tensordict-eager] | 0.6061ms | 0.2139ms | 4.6760 KOps/s | 4.6640 KOps/s | |
| test_compile_add_one_flat[tensorclass-compile] | 0.5109ms | 98.5159μs | 10.1506 KOps/s | 10.0575 KOps/s | |
| test_compile_add_one_flat[tensorclass-eager] | 0.4475ms | 52.4832μs | 19.0537 KOps/s | 18.4079 KOps/s | |
| test_compile_add_one_flat[pytree-compile] | 0.1944ms | 0.1368ms | 7.3108 KOps/s | 7.1949 KOps/s | |
| test_compile_add_one_flat[pytree-eager] | 0.8633ms | 0.4797ms | 2.0846 KOps/s | 2.0028 KOps/s | |
| test_compile_add_self_flat[tensordict-eager] | 0.6324ms | 0.2550ms | 3.9210 KOps/s | 3.8819 KOps/s | |
| test_compile_add_self_flat[tensordict-compile] | 0.1842ms | 0.1451ms | 6.8913 KOps/s | 6.8707 KOps/s | |
| test_compile_add_self_flat[tensorclass-eager] | 0.1399ms | 62.7009μs | 15.9487 KOps/s | 15.1838 KOps/s | |
| test_compile_add_self_flat[tensorclass-compile] | 0.1427ms | 99.2836μs | 10.0722 KOps/s | 9.9824 KOps/s | |
| test_compile_add_self_flat[pytree-eager] | 0.7920ms | 0.4099ms | 2.4395 KOps/s | 2.3795 KOps/s | |
| test_compile_add_self_flat[pytree-compile] | 0.1725ms | 0.1365ms | 7.3256 KOps/s | 7.3530 KOps/s | |
| test_compile_copy_flat[tensordict-compile] | 51.3610μs | 19.1881μs | 52.1155 KOps/s | 53.2675 KOps/s | |
| test_compile_copy_flat[tensordict-eager] | 0.3978ms | 27.5283μs | 36.3263 KOps/s | 35.4477 KOps/s | |
| test_compile_copy_flat[pytree-compile] | 0.4426ms | 69.6551μs | 14.3565 KOps/s | 14.2530 KOps/s | |
| test_compile_copy_flat[pytree-eager] | 0.4146ms | 52.2845μs | 19.1261 KOps/s | 19.1529 KOps/s | |
| test_compile_assign_and_add[tensordict-compile] | 1.6496ms | 0.3967ms | 2.5208 KOps/s | 2.2150 KOps/s | |
| test_compile_assign_and_add[tensordict-eager] | 2.8754ms | 2.5725ms | 388.7203 Ops/s | 369.8914 Ops/s | |
| test_compile_assign_and_add[pytree-compile] | 1.6045ms | 0.3843ms | 2.6020 KOps/s | 2.2311 KOps/s | |
| test_compile_assign_and_add[pytree-eager] | 2.7652ms | 2.6181ms | 381.9562 Ops/s | 363.4155 Ops/s | |
| test_compile_indexing[tensor-tensordict-compile] | 0.1754ms | 0.1193ms | 8.3831 KOps/s | 8.5797 KOps/s | |
| test_compile_indexing[tensor-tensordict-eager] | 0.5872ms | 83.5399μs | 11.9703 KOps/s | 11.9588 KOps/s | |
| test_compile_indexing[tensor-tensorclass-compile] | 0.1684ms | 0.1084ms | 9.2254 KOps/s | 9.2584 KOps/s | |
| test_compile_indexing[tensor-tensorclass-eager] | 0.1759ms | 70.7248μs | 14.1393 KOps/s | 14.0956 KOps/s | |
| test_compile_indexing[tensor-pytree-compile] | 0.2154ms | 0.1109ms | 9.0138 KOps/s | 9.2368 KOps/s | |
| test_compile_indexing[tensor-pytree-eager] | 0.1102ms | 72.4620μs | 13.8003 KOps/s | 14.1005 KOps/s | |
| test_compile_indexing[slice-tensordict-compile] | 0.2162ms | 0.1032ms | 9.6893 KOps/s | 9.7720 KOps/s | |
| test_compile_indexing[slice-tensordict-eager] | 0.1426ms | 17.0361μs | 58.6989 KOps/s | 54.6586 KOps/s | |
| test_compile_indexing[slice-tensorclass-compile] | 0.1485ms | 98.3474μs | 10.1680 KOps/s | 10.1583 KOps/s | |
| test_compile_indexing[slice-tensorclass-eager] | 67.8610μs | 16.1262μs | 62.0108 KOps/s | 60.2145 KOps/s | |
| test_compile_indexing[slice-pytree-compile] | 0.1517ms | 98.5377μs | 10.1484 KOps/s | 10.0767 KOps/s | |
| test_compile_indexing[slice-pytree-eager] | 51.8920μs | 15.9462μs | 62.7108 KOps/s | 60.6203 KOps/s | |
| test_compile_indexing[int-tensordict-compile] | 0.1699ms | 0.1055ms | 9.4797 KOps/s | 9.6738 KOps/s | |
| test_compile_indexing[int-tensordict-eager] | 0.5822ms | 17.1686μs | 58.2459 KOps/s | 54.7100 KOps/s | |
| test_compile_indexing[int-tensorclass-compile] | 0.1574ms | 0.1012ms | 9.8858 KOps/s | 10.0681 KOps/s | |
| test_compile_indexing[int-tensorclass-eager] | 78.2010μs | 15.8987μs | 62.8982 KOps/s | 60.2022 KOps/s | |
| test_compile_indexing[int-pytree-compile] | 0.1641ms | 0.1016ms | 9.8388 KOps/s | 10.0597 KOps/s | |
| test_compile_indexing[int-pytree-eager] | 48.1810μs | 17.1370μs | 58.3532 KOps/s | 60.7214 KOps/s | |
| test_mod_add[eager] | 0.1623ms | 30.9120μs | 32.3499 KOps/s | 29.8291 KOps/s | |
| test_mod_add[compile] | 0.1637ms | 78.2672μs | 12.7767 KOps/s | 12.5083 KOps/s | |
| test_mod_add[compile-overhead] | 0.3136ms | 0.1633ms | 6.1242 KOps/s | 5.6556 KOps/s | |
| test_mod_wrap[eager] | 0.3229ms | 0.2419ms | 4.1331 KOps/s | 4.0043 KOps/s | |
| test_mod_wrap[compile] | 1.5628ms | 0.2820ms | 3.5457 KOps/s | 3.4330 KOps/s | |
| test_mod_wrap[compile-overhead] | 7.8031ms | 4.0129ms | 249.1993 Ops/s | 253.2873 Ops/s | |
| test_mod_wrap_and_backward[eager] | 1.4860ms | 1.3645ms | 732.8913 Ops/s | 679.7189 Ops/s | |
| test_mod_wrap_and_backward[compile] | 1.3786ms | 1.2627ms | 791.9331 Ops/s | 716.0307 Ops/s | |
| test_mod_wrap_and_backward[compile-overhead] | 1.3612ms | 0.9302ms | 1.0750 KOps/s | 964.5892 Ops/s | |
| test_seq_add[eager] | 0.1443ms | 99.8794μs | 10.0121 KOps/s | 9.8580 KOps/s | |
| test_seq_add[compile] | 0.2508ms | 91.0381μs | 10.9844 KOps/s | 11.2994 KOps/s | |
| test_seq_add[compile-overhead] | 0.1772ms | 0.1263ms | 7.9198 KOps/s | 7.7368 KOps/s | |
| test_seq_wrap[eager] | 0.4641ms | 0.3932ms | 2.5430 KOps/s | 2.5638 KOps/s | |
| test_seq_wrap[compile] | 0.3578ms | 0.3018ms | 3.3134 KOps/s | 3.2406 KOps/s | |
| test_seq_wrap[compile-overhead] | 0.2721ms | 0.2248ms | 4.4476 KOps/s | 4.4381 KOps/s | |
| test_func_call_runtime[False-eager] | 0.8198ms | 0.7439ms | 1.3443 KOps/s | 1.3104 KOps/s | |
| test_func_call_runtime[False-compile] | 0.7960ms | 0.7429ms | 1.3461 KOps/s | 1.3210 KOps/s | |
| test_func_call_runtime[False-compile-overhead] | 0.4266ms | 0.3625ms | 2.7590 KOps/s | 2.7382 KOps/s | |
| test_func_call_runtime[True-eager] | 0.9994ms | 0.9076ms | 1.1018 KOps/s | 1.0707 KOps/s | |
| test_func_call_runtime[True-compile] | 0.8070ms | 0.7650ms | 1.3072 KOps/s | 1.2818 KOps/s | |
| test_func_call_runtime[True-compile-overhead] | 0.4338ms | 0.3841ms | 2.6037 KOps/s | 2.5822 KOps/s | |
| test_func_call_cm_runtime[False-eager] | 0.7938ms | 0.7399ms | 1.3515 KOps/s | 1.3117 KOps/s | |
| test_func_call_cm_runtime[False-compile] | 0.7989ms | 0.7478ms | 1.3373 KOps/s | 1.3088 KOps/s | |
| test_func_call_cm_runtime[False-compile-overhead] | 0.4333ms | 0.3638ms | 2.7488 KOps/s | 2.7212 KOps/s | |
| test_func_call_cm_runtime[True-eager] | 1.1004ms | 1.0068ms | 993.2470 Ops/s | 970.0565 Ops/s | |
| test_func_call_cm_runtime[True-compile] | 0.8319ms | 0.7927ms | 1.2615 KOps/s | 1.2298 KOps/s | |
| test_func_call_cm_runtime[True-compile-overhead] | 0.4706ms | 0.4103ms | 2.4372 KOps/s | 2.3956 KOps/s | |
| test_vmap_func_call_cm_runtime[eager] | 2.5859ms | 2.1093ms | 474.0832 Ops/s | 471.2747 Ops/s | |
| test_vmap_func_call_cm_runtime[compile] | 0.9460ms | 0.8083ms | 1.2371 KOps/s | 1.2053 KOps/s | |
| test_vmap_func_call_cm_runtime[compile-overhead] | 0.5125ms | 0.4113ms | 2.4315 KOps/s | 2.4133 KOps/s | |
| test_distributed | 2.8343ms | 0.1838ms | 5.4419 KOps/s | 8.7668 KOps/s | |
| test_tdmodule | 0.9226ms | 14.4710μs | 69.1035 KOps/s | 72.0395 KOps/s | |
| test_tdmodule_dispatch | 72.3210μs | 29.2622μs | 34.1738 KOps/s | 36.1724 KOps/s | |
| test_tdseq | 27.8810μs | 16.2286μs | 61.6195 KOps/s | 64.2071 KOps/s | |
| test_tdseq_dispatch | 52.7810μs | 32.1975μs | 31.0583 KOps/s | 32.1993 KOps/s | |
| test_instantiation_functorch | 1.7289ms | 1.6248ms | 615.4744 Ops/s | 626.9616 Ops/s | |
| test_exec_functorch | 0.1971ms | 0.1497ms | 6.6783 KOps/s | 6.6355 KOps/s | |
| test_exec_functional_call | 0.1806ms | 0.1449ms | 6.9002 KOps/s | 6.9219 KOps/s | |
| test_exec_td_decorator | 0.3659ms | 0.1821ms | 5.4907 KOps/s | 5.3297 KOps/s | |
| test_vmap_mlp_speed_decorator[True-True] | 0.7758ms | 0.6758ms | 1.4798 KOps/s | 1.4580 KOps/s | |
| test_vmap_mlp_speed_decorator[True-False] | 0.8314ms | 0.6761ms | 1.4791 KOps/s | 1.4551 KOps/s | |
| test_vmap_mlp_speed_decorator[False-True] | 0.7491ms | 0.6028ms | 1.6590 KOps/s | 1.6570 KOps/s | |
| test_vmap_mlp_speed_decorator[False-False] | 0.7091ms | 0.5959ms | 1.6782 KOps/s | 1.6532 KOps/s | |
| test_vmap_transformer_speed_decorator[True-True] | 19.3402ms | 19.2319ms | 51.9969 Ops/s | 51.6734 Ops/s | |
| test_vmap_transformer_speed_decorator[True-False] | 19.3835ms | 19.2895ms | 51.8417 Ops/s | 51.5756 Ops/s | |
| test_vmap_transformer_speed_decorator[False-True] | 19.8917ms | 19.2493ms | 51.9498 Ops/s | 52.0376 Ops/s | |
| test_vmap_transformer_speed_decorator[False-False] | 19.2595ms | 19.1625ms | 52.1854 Ops/s | 51.9438 Ops/s | |
| test_to_module_speed[True] | 2.2034ms | 0.9575ms | 1.0444 KOps/s | 1.0380 KOps/s | |
| test_to_module_speed[False] | 1.0440ms | 0.9362ms | 1.0682 KOps/s | 1.0606 KOps/s | |
| test_tc_init | 77.0220μs | 36.2066μs | 27.6193 KOps/s | 27.1933 KOps/s | |
| test_tc_init_nested | 0.1061ms | 72.0913μs | 13.8713 KOps/s | 13.5382 KOps/s | |
| test_tc_first_layer_tensor | 13.2560μs | 0.7410μs | 1.3495 MOps/s | 1.3486 MOps/s | |
| test_tc_first_layer_nontensor | 21.9100μs | 2.5443μs | 393.0297 KOps/s | 407.7526 KOps/s | |
| test_tc_second_layer_tensor | 43.4777μs | 1.5003μs | 666.5185 KOps/s | 655.1570 KOps/s | |
| test_tc_second_layer_nontensor | 23.4510μs | 3.3213μs | 301.0862 KOps/s | 309.8165 KOps/s | |
| test_unbind | 0.2150s | 9.7356ms | 102.7162 Ops/s | 146.1191 Ops/s | |
| test_full_like | 11.7402ms | 9.2608ms | 107.9824 Ops/s | 107.2714 Ops/s | |
| test_zeros_like | 4.9638ms | 4.2592ms | 234.7844 Ops/s | 238.9750 Ops/s | |
| test_ones_like | 4.9422ms | 4.3363ms | 230.6127 Ops/s | 230.7957 Ops/s | |
| test_clone | 6.9231ms | 6.4614ms | 154.7657 Ops/s | 108.2046 Ops/s | |
| test_squeeze | 63.8920μs | 9.5019μs | 105.2425 KOps/s | 103.8334 KOps/s | |
| test_unsqueeze | 0.1202ms | 71.5794μs | 13.9705 KOps/s | 13.4251 KOps/s | |
| test_split | 0.2963ms | 0.1596ms | 6.2659 KOps/s | 6.0522 KOps/s | |
| test_permute | 0.2186ms | 0.1783ms | 5.6094 KOps/s | 5.3967 KOps/s | |
| test_stack | 51.9027ms | 50.9478ms | 19.6279 Ops/s | 19.5201 Ops/s | |
| test_cat | 51.0426ms | 50.7232ms | 19.7148 Ops/s | 19.6579 Ops/s |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment
Labels
CLA Signed
This label is managed by the Facebook bot. Authors need to sign the CLA before a PR can be reviewed.
Add this suggestion to a batch that can be applied as a single commit.
This suggestion is invalid because no changes were made to the code.
Suggestions cannot be applied while the pull request is closed.
Suggestions cannot be applied while viewing a subset of changes.
Only one suggestion per line can be applied in a batch.
Add this suggestion to a batch that can be applied as a single commit.
Applying suggestions on deleted lines is not supported.
You must change the existing code in this line in order to create a valid suggestion.
Outdated suggestions cannot be applied.
This suggestion has been applied or marked resolved.
Suggestions cannot be applied from pending reviews.
Suggestions cannot be applied on multi-line comments.
Suggestions cannot be applied while the pull request is queued to merge.
Suggestion cannot be applied right now. Please check back later.
Stack from ghstack (oldest at bottom):