-
Notifications
You must be signed in to change notification settings - Fork 108
[BugFix] TDParams.to(device) works as nn.Module, not TDParams contained TD #1025
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Merged
Conversation
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| Name | Max | Mean | Ops | Ops on Repo HEAD | Change |
|---|---|---|---|---|---|
| test_plain_set_nested | 50.2940μs | 25.6590μs | 38.9727 KOps/s | 39.7246 KOps/s | |
| test_plain_set_stack_nested | 61.4650μs | 26.6035μs | 37.5890 KOps/s | 39.3695 KOps/s | |
| test_plain_set_nested_inplace | 74.0390μs | 28.2549μs | 35.3921 KOps/s | 35.6244 KOps/s | |
| test_plain_set_stack_nested_inplace | 77.1640μs | 28.4961μs | 35.0925 KOps/s | 35.9643 KOps/s | |
| test_items | 28.0020μs | 4.3045μs | 232.3142 KOps/s | 237.3400 KOps/s | |
| test_items_nested | 0.9308ms | 0.3895ms | 2.5671 KOps/s | 2.5107 KOps/s | |
| test_items_nested_locked | 0.7881ms | 0.3811ms | 2.6240 KOps/s | 2.5526 KOps/s | |
| test_items_nested_leaf | 0.1674ms | 80.7126μs | 12.3896 KOps/s | 12.3998 KOps/s | |
| test_items_stack_nested | 0.8774ms | 0.3842ms | 2.6027 KOps/s | 2.5504 KOps/s | |
| test_items_stack_nested_leaf | 0.2003ms | 83.9522μs | 11.9115 KOps/s | 11.8197 KOps/s | |
| test_items_stack_nested_locked | 0.6223ms | 0.3838ms | 2.6058 KOps/s | 2.5473 KOps/s | |
| test_keys | 30.2760μs | 3.5724μs | 279.9232 KOps/s | 282.2615 KOps/s | |
| test_keys_nested | 0.2503ms | 0.1362ms | 7.3402 KOps/s | 7.2897 KOps/s | |
| test_keys_nested_locked | 0.7267ms | 0.1419ms | 7.0482 KOps/s | 7.0427 KOps/s | |
| test_keys_nested_leaf | 0.2266ms | 0.1195ms | 8.3706 KOps/s | 8.3613 KOps/s | |
| test_keys_stack_nested | 0.2194ms | 0.1365ms | 7.3278 KOps/s | 7.4007 KOps/s | |
| test_keys_stack_nested_leaf | 0.1978ms | 0.1186ms | 8.4310 KOps/s | 8.5274 KOps/s | |
| test_keys_stack_nested_locked | 0.2589ms | 0.1414ms | 7.0721 KOps/s | 7.1515 KOps/s | |
| test_values | 6.8950μs | 1.0647μs | 939.1974 KOps/s | 925.7938 KOps/s | |
| test_values_nested | 0.1609ms | 95.1262μs | 10.5123 KOps/s | 10.5073 KOps/s | |
| test_values_nested_locked | 0.1578ms | 94.4815μs | 10.5841 KOps/s | 10.4701 KOps/s | |
| test_values_nested_leaf | 0.1447ms | 81.1289μs | 12.3261 KOps/s | 12.2421 KOps/s | |
| test_values_stack_nested | 0.1729ms | 95.0095μs | 10.5253 KOps/s | 10.4723 KOps/s | |
| test_values_stack_nested_leaf | 0.2921ms | 83.1363μs | 12.0284 KOps/s | 11.9707 KOps/s | |
| test_values_stack_nested_locked | 0.1736ms | 96.1602μs | 10.3993 KOps/s | 10.5424 KOps/s | |
| test_membership | 15.4690μs | 0.8862μs | 1.1284 MOps/s | 1.3151 MOps/s | |
| test_membership_nested | 31.9490μs | 2.7778μs | 360.0000 KOps/s | 357.3488 KOps/s | |
| test_membership_nested_leaf | 29.8660μs | 2.8004μs | 357.0934 KOps/s | 355.6549 KOps/s | |
| test_membership_stacked_nested | 34.6350μs | 2.8081μs | 356.1112 KOps/s | 355.2089 KOps/s | |
| test_membership_stacked_nested_leaf | 29.0140μs | 2.7948μs | 357.8133 KOps/s | 357.1981 KOps/s | |
| test_membership_nested_last | 40.6760μs | 4.3134μs | 231.8352 KOps/s | 232.8526 KOps/s | |
| test_membership_nested_leaf_last | 45.1140μs | 4.2939μs | 232.8864 KOps/s | 232.6466 KOps/s | |
| test_membership_stacked_nested_last | 31.1180μs | 5.2784μs | 189.4503 KOps/s | 165.9311 KOps/s | |
| test_membership_stacked_nested_leaf_last | 41.9380μs | 5.1274μs | 195.0319 KOps/s | 167.1690 KOps/s | |
| test_nested_getleaf | 0.2023ms | 10.7758μs | 92.8007 KOps/s | 94.7035 KOps/s | |
| test_nested_get | 33.9130μs | 10.5453μs | 94.8292 KOps/s | 99.5428 KOps/s | |
| test_stacked_getleaf | 35.5570μs | 10.3817μs | 96.3238 KOps/s | 94.8991 KOps/s | |
| test_stacked_get | 44.8030μs | 10.4260μs | 95.9144 KOps/s | 99.2752 KOps/s | |
| test_nested_getitemleaf | 32.8920μs | 11.5634μs | 86.4794 KOps/s | 91.5158 KOps/s | |
| test_nested_getitem | 97.5520μs | 10.0491μs | 99.5118 KOps/s | 97.9059 KOps/s | |
| test_stacked_getitemleaf | 41.7380μs | 11.3045μs | 88.4602 KOps/s | 91.4027 KOps/s | |
| test_stacked_getitem | 37.0790μs | 10.7066μs | 93.4005 KOps/s | 98.3284 KOps/s | |
| test_lock_nested | 85.5881ms | 0.5915ms | 1.6906 KOps/s | 1.9882 KOps/s | |
| test_lock_stack_nested | 0.9293ms | 0.4794ms | 2.0858 KOps/s | 2.1717 KOps/s | |
| test_unlock_nested | 91.6418ms | 0.5132ms | 1.9486 KOps/s | 2.3850 KOps/s | |
| test_unlock_stack_nested | 0.6124ms | 0.3901ms | 2.5632 KOps/s | 2.6486 KOps/s | |
| test_flatten_speed | 0.6342ms | 0.1029ms | 9.7212 KOps/s | 10.1688 KOps/s | |
| test_unflatten_speed | 0.6344ms | 0.5258ms | 1.9018 KOps/s | 1.9418 KOps/s | |
| test_common_ops | 5.5903ms | 1.1876ms | 842.0308 Ops/s | 868.9657 Ops/s | |
| test_creation | 25.3880μs | 2.1204μs | 471.6090 KOps/s | 490.7029 KOps/s | |
| test_creation_empty | 47.1980μs | 20.6255μs | 48.4836 KOps/s | 52.5381 KOps/s | |
| test_creation_nested_1 | 92.9730μs | 23.9604μs | 41.7355 KOps/s | 44.7458 KOps/s | |
| test_creation_nested_2 | 67.2650μs | 28.2217μs | 35.4338 KOps/s | 37.4512 KOps/s | |
| test_clone | 0.1756ms | 18.0360μs | 55.4446 KOps/s | 58.7312 KOps/s | |
| test_getitem[int] | 1.2652ms | 17.1530μs | 58.2990 KOps/s | 55.2242 KOps/s | |
| test_getitem[slice_int] | 0.1383ms | 32.4025μs | 30.8618 KOps/s | 32.5553 KOps/s | |
| test_getitem[range] | 0.1974ms | 61.0342μs | 16.3843 KOps/s | 17.5390 KOps/s | |
| test_getitem[tuple] | 0.1478ms | 25.7932μs | 38.7700 KOps/s | 39.2534 KOps/s | |
| test_getitem[list] | 0.1896ms | 55.6405μs | 17.9725 KOps/s | 19.1793 KOps/s | |
| test_setitem_dim[int] | 66.5130μs | 33.9364μs | 29.4669 KOps/s | 31.1269 KOps/s | |
| test_setitem_dim[slice_int] | 0.1202ms | 63.0320μs | 15.8649 KOps/s | 16.2634 KOps/s | |
| test_setitem_dim[range] | 0.1439ms | 86.4596μs | 11.5661 KOps/s | 11.8403 KOps/s | |
| test_setitem_dim[tuple] | 76.4130μs | 50.8861μs | 19.6517 KOps/s | 20.3712 KOps/s | |
| test_setitem | 89.9780μs | 31.8247μs | 31.4221 KOps/s | 33.6142 KOps/s | |
| test_set | 0.2832ms | 31.7483μs | 31.4978 KOps/s | 33.9207 KOps/s | |
| test_set_shared | 2.5235ms | 0.2251ms | 4.4434 KOps/s | 4.6486 KOps/s | |
| test_update | 0.1408ms | 40.4316μs | 24.7332 KOps/s | 26.2358 KOps/s | |
| test_update_nested | 0.1509ms | 51.9748μs | 19.2401 KOps/s | 19.7761 KOps/s | |
| test_update__nested | 0.1391ms | 39.3834μs | 25.3914 KOps/s | 27.0556 KOps/s | |
| test_set_nested | 0.1046ms | 34.2631μs | 29.1859 KOps/s | 30.9160 KOps/s | |
| test_set_nested_new | 0.1461ms | 38.5546μs | 25.9372 KOps/s | 26.3869 KOps/s | |
| test_select | 0.6559ms | 56.1477μs | 17.8102 KOps/s | 18.1215 KOps/s | |
| test_select_nested | 0.1510ms | 60.2731μs | 16.5911 KOps/s | 16.5598 KOps/s | |
| test_exclude_nested | 0.1437ms | 75.6725μs | 13.2148 KOps/s | 13.2669 KOps/s | |
| test_empty[True] | 1.1479ms | 0.3594ms | 2.7821 KOps/s | 2.7933 KOps/s | |
| test_empty[False] | 6.2517μs | 1.2326μs | 811.3142 KOps/s | 815.8795 KOps/s | |
| test_unbind_speed | 0.3927ms | 0.3065ms | 3.2630 KOps/s | 3.3194 KOps/s | |
| test_unbind_speed_stack0 | 0.4064ms | 0.3020ms | 3.3108 KOps/s | 3.4532 KOps/s | |
| test_unbind_speed_stack1 | 87.4237ms | 0.8805ms | 1.1358 KOps/s | 1.4945 KOps/s | |
| test_split | 91.8885ms | 2.1977ms | 455.0199 Ops/s | 459.0423 Ops/s | |
| test_chunk | 2.2267ms | 2.0269ms | 493.3619 Ops/s | 462.1634 Ops/s | |
| test_creation[device0] | 0.2225ms | 0.1161ms | 8.6125 KOps/s | 8.5843 KOps/s | |
| test_creation_from_tensor | 2.0801ms | 0.1164ms | 8.5882 KOps/s | 8.5073 KOps/s | |
| test_add_one[memmap_tensor0] | 0.3599ms | 7.7686μs | 128.7236 KOps/s | 143.9164 KOps/s | |
| test_contiguous[memmap_tensor0] | 19.1160μs | 1.9067μs | 524.4565 KOps/s | 527.3610 KOps/s | |
| test_stack[memmap_tensor0] | 68.6980μs | 5.8235μs | 171.7169 KOps/s | 180.5322 KOps/s | |
| test_memmaptd_index | 1.1263ms | 0.4154ms | 2.4070 KOps/s | 2.4104 KOps/s | |
| test_memmaptd_index_astensor | 1.0563ms | 0.5212ms | 1.9185 KOps/s | 1.9405 KOps/s | |
| test_memmaptd_index_op | 5.6670ms | 1.1262ms | 887.9147 Ops/s | 945.1342 Ops/s | |
| test_serialize_model | 0.1240s | 0.1170s | 8.5461 Ops/s | 8.2200 Ops/s | |
| test_serialize_model_pickle | 0.4441s | 0.3886s | 2.5734 Ops/s | 2.5381 Ops/s | |
| test_serialize_weights | 0.1313s | 0.1171s | 8.5399 Ops/s | 8.5578 Ops/s | |
| test_serialize_weights_returnearly | 0.1842s | 0.1626s | 6.1500 Ops/s | 6.3035 Ops/s | |
| test_serialize_weights_pickle | 0.4621s | 0.4064s | 2.4604 Ops/s | 2.4326 Ops/s | |
| test_serialize_weights_filesystem | 0.2402s | 0.1542s | 6.4870 Ops/s | 6.8730 Ops/s | |
| test_serialize_model_filesystem | 0.1541s | 0.1490s | 6.7136 Ops/s | 6.1556 Ops/s | |
| test_reshape_pytree | 0.1414ms | 41.0697μs | 24.3488 KOps/s | 25.5210 KOps/s | |
| test_reshape_td | 0.1320ms | 46.6739μs | 21.4253 KOps/s | 21.9653 KOps/s | |
| test_view_pytree | 0.1058ms | 39.1788μs | 25.5240 KOps/s | 25.6152 KOps/s | |
| test_view_td | 0.1037ms | 51.3311μs | 19.4814 KOps/s | 19.5117 KOps/s | |
| test_unbind_pytree | 0.1275ms | 36.4839μs | 27.4094 KOps/s | 28.1216 KOps/s | |
| test_unbind_td | 0.3080ms | 45.3722μs | 22.0399 KOps/s | 22.4313 KOps/s | |
| test_split_pytree | 74.8000μs | 38.5272μs | 25.9557 KOps/s | 26.3532 KOps/s | |
| test_split_td | 0.4819ms | 57.2293μs | 17.4736 KOps/s | 17.6004 KOps/s | |
| test_add_pytree | 95.7280μs | 46.4507μs | 21.5282 KOps/s | 23.0029 KOps/s | |
| test_add_td | 0.1824ms | 90.7191μs | 11.0230 KOps/s | 11.8582 KOps/s | |
| test_compile_add_one_nested[tensordict-compile] | 0.1763ms | 57.1158μs | 17.5083 KOps/s | 16.5608 KOps/s | |
| test_compile_add_one_nested[tensordict-eager] | 0.3487ms | 0.1928ms | 5.1854 KOps/s | 5.1202 KOps/s | |
| test_compile_add_one_nested[pytree-compile] | 0.1754ms | 56.2543μs | 17.7764 KOps/s | 17.9296 KOps/s | |
| test_compile_add_one_nested[pytree-eager] | 0.2672ms | 0.1427ms | 7.0055 KOps/s | 7.2740 KOps/s | |
| test_compile_copy_nested[tensordict-compile] | 62.4860μs | 23.5347μs | 42.4904 KOps/s | 43.6455 KOps/s | |
| test_compile_copy_nested[tensordict-eager] | 0.1412ms | 75.0062μs | 13.3322 KOps/s | 13.4119 KOps/s | |
| test_compile_copy_nested[pytree-compile] | 0.1382ms | 74.7134μs | 13.3845 KOps/s | 13.0764 KOps/s | |
| test_compile_copy_nested[pytree-eager] | 0.1801ms | 68.2873μs | 14.6440 KOps/s | 14.4227 KOps/s | |
| test_compile_add_one_flat[tensordict-compile] | 0.3709ms | 0.1825ms | 5.4803 KOps/s | 5.5401 KOps/s | |
| test_compile_add_one_flat[tensordict-eager] | 0.4474ms | 0.2356ms | 4.2450 KOps/s | 4.1395 KOps/s | |
| test_compile_add_one_flat[tensorclass-compile] | 0.1176ms | 46.6427μs | 21.4396 KOps/s | 20.8548 KOps/s | |
| test_compile_add_one_flat[tensorclass-eager] | 0.1557ms | 78.0925μs | 12.8053 KOps/s | 12.9536 KOps/s | |
| test_compile_add_one_flat[pytree-compile] | 0.4995ms | 0.1792ms | 5.5818 KOps/s | 5.7744 KOps/s | |
| test_compile_add_one_flat[pytree-eager] | 0.5872ms | 0.2941ms | 3.4004 KOps/s | 3.5252 KOps/s | |
| test_compile_add_self_flat[tensordict-eager] | 0.5891ms | 0.2726ms | 3.6683 KOps/s | 3.6624 KOps/s | |
| test_compile_add_self_flat[tensordict-compile] | 0.9371ms | 0.1888ms | 5.2974 KOps/s | 5.5461 KOps/s | |
| test_compile_add_self_flat[tensorclass-eager] | 0.2469ms | 74.6299μs | 13.3995 KOps/s | 13.6509 KOps/s | |
| test_compile_add_self_flat[tensorclass-compile] | 0.1084ms | 48.1405μs | 20.7725 KOps/s | 20.4421 KOps/s | |
| test_compile_add_self_flat[pytree-eager] | 0.3997ms | 0.2325ms | 4.3014 KOps/s | 4.3389 KOps/s | |
| test_compile_add_self_flat[pytree-compile] | 0.4011ms | 0.1759ms | 5.6864 KOps/s | 5.5817 KOps/s | |
| test_compile_copy_flat[tensordict-compile] | 0.2084ms | 0.1129ms | 8.8610 KOps/s | 8.9733 KOps/s | |
| test_compile_copy_flat[tensordict-eager] | 0.1562ms | 79.3523μs | 12.6020 KOps/s | 12.4885 KOps/s | |
| test_compile_copy_flat[pytree-compile] | 0.1710ms | 77.2631μs | 12.9428 KOps/s | 12.6718 KOps/s | |
| test_compile_copy_flat[pytree-eager] | 0.6479ms | 68.1010μs | 14.6841 KOps/s | 13.7423 KOps/s | |
| test_compile_assign_and_add[tensordict-compile] | 0.5004ms | 0.1980ms | 5.0503 KOps/s | 5.1542 KOps/s | |
| test_compile_assign_and_add[tensordict-eager] | 2.8045ms | 1.7538ms | 570.1850 Ops/s | 565.7420 Ops/s | |
| test_compile_assign_and_add[pytree-compile] | 0.3795ms | 0.1895ms | 5.2778 KOps/s | 5.2448 KOps/s | |
| test_compile_assign_and_add[pytree-eager] | 1.3495ms | 1.1091ms | 901.6145 Ops/s | 925.4348 Ops/s | |
| test_compile_assign_and_add_stack[compile] | 0.7620ms | 0.4191ms | 2.3863 KOps/s | 2.4154 KOps/s | |
| test_compile_assign_and_add_stack[eager] | 7.2337ms | 4.2343ms | 236.1672 Ops/s | 249.5010 Ops/s | |
| test_compile_indexing[tensor-tensordict-compile] | 0.1174ms | 33.9847μs | 29.4250 KOps/s | 28.8533 KOps/s | |
| test_compile_indexing[tensor-tensordict-eager] | 1.4751ms | 50.0074μs | 19.9970 KOps/s | 21.1101 KOps/s | |
| test_compile_indexing[tensor-tensorclass-compile] | 81.9630μs | 29.7875μs | 33.5711 KOps/s | 34.8536 KOps/s | |
| test_compile_indexing[tensor-tensorclass-eager] | 0.1368ms | 29.7860μs | 33.5728 KOps/s | 36.0717 KOps/s | |
| test_compile_indexing[tensor-pytree-compile] | 81.4720μs | 29.0051μs | 34.4767 KOps/s | 34.8692 KOps/s | |
| test_compile_indexing[tensor-pytree-eager] | 89.5070μs | 29.7303μs | 33.6357 KOps/s | 35.9627 KOps/s | |
| test_compile_indexing[slice-tensordict-compile] | 0.1379ms | 73.8739μs | 13.5366 KOps/s | 13.5256 KOps/s | |
| test_compile_indexing[slice-tensordict-eager] | 0.6299ms | 28.9423μs | 34.5515 KOps/s | 36.1304 KOps/s | |
| test_compile_indexing[slice-tensorclass-compile] | 0.1468ms | 67.9924μs | 14.7075 KOps/s | 14.9093 KOps/s | |
| test_compile_indexing[slice-tensorclass-eager] | 83.7090μs | 23.7043μs | 42.1864 KOps/s | 43.8710 KOps/s | |
| test_compile_indexing[slice-pytree-compile] | 0.1540ms | 67.9220μs | 14.7228 KOps/s | 14.9347 KOps/s | |
| test_compile_indexing[slice-pytree-eager] | 74.5190μs | 23.4252μs | 42.6891 KOps/s | 43.6565 KOps/s | |
| test_compile_indexing[int-tensordict-compile] | 0.1317ms | 74.0532μs | 13.5038 KOps/s | 13.7455 KOps/s | |
| test_compile_indexing[int-tensordict-eager] | 1.3073ms | 28.2987μs | 35.3373 KOps/s | 36.9581 KOps/s | |
| test_compile_indexing[int-tensorclass-compile] | 0.1446ms | 68.3881μs | 14.6224 KOps/s | 14.9664 KOps/s | |
| test_compile_indexing[int-tensorclass-eager] | 79.2500μs | 23.5089μs | 42.5372 KOps/s | 43.6507 KOps/s | |
| test_compile_indexing[int-pytree-compile] | 0.1340ms | 67.9478μs | 14.7172 KOps/s | 14.9927 KOps/s | |
| test_compile_indexing[int-pytree-eager] | 94.8770μs | 23.9473μs | 41.7584 KOps/s | 44.1714 KOps/s | |
| test_mod_add[eager] | 0.1145ms | 27.3884μs | 36.5118 KOps/s | 37.7922 KOps/s | |
| test_mod_add[compile] | 86.8120μs | 38.0252μs | 26.2983 KOps/s | 26.2431 KOps/s | |
| test_mod_add[compile-overhead] | 97.1110μs | 38.0142μs | 26.3059 KOps/s | 26.3587 KOps/s | |
| test_mod_wrap[eager] | 0.4261ms | 0.2147ms | 4.6566 KOps/s | 4.7991 KOps/s | |
| test_mod_wrap[compile] | 0.3334ms | 0.2291ms | 4.3640 KOps/s | 4.3634 KOps/s | |
| test_mod_wrap[compile-overhead] | 0.4360ms | 0.2300ms | 4.3482 KOps/s | 4.3812 KOps/s | |
| test_mod_wrap_and_backward[eager] | 13.0784ms | 11.2141ms | 89.1736 Ops/s | 87.1064 Ops/s | |
| test_mod_wrap_and_backward[compile] | 12.3796ms | 11.0682ms | 90.3492 Ops/s | 82.8059 Ops/s | |
| test_mod_wrap_and_backward[compile-overhead] | 12.0289ms | 11.2810ms | 88.6443 Ops/s | 82.7064 Ops/s | |
| test_seq_add[eager] | 0.1876ms | 94.7983μs | 10.5487 KOps/s | 10.8268 KOps/s | |
| test_seq_add[compile] | 0.1436ms | 64.6124μs | 15.4769 KOps/s | 15.2638 KOps/s | |
| test_seq_add[compile-overhead] | 0.1276ms | 63.6710μs | 15.7057 KOps/s | 15.6348 KOps/s | |
| test_seq_wrap[eager] | 0.6547ms | 0.3957ms | 2.5274 KOps/s | 2.5584 KOps/s | |
| test_seq_wrap[compile] | 1.3905ms | 0.2684ms | 3.7255 KOps/s | 3.7084 KOps/s | |
| test_seq_wrap[compile-overhead] | 1.5264ms | 0.2662ms | 3.7571 KOps/s | 3.7090 KOps/s | |
| test_func_call_runtime[False-eager] | 1.8250ms | 0.5429ms | 1.8418 KOps/s | 1.8848 KOps/s | |
| test_func_call_runtime[False-compile] | 0.6244ms | 0.4983ms | 2.0067 KOps/s | 2.0205 KOps/s | |
| test_func_call_runtime[False-compile-overhead] | 0.7075ms | 0.4987ms | 2.0054 KOps/s | 2.0204 KOps/s | |
| test_func_call_runtime[True-eager] | 0.9665ms | 0.7525ms | 1.3288 KOps/s | 1.3223 KOps/s | |
| test_func_call_runtime[True-compile] | 1.1494ms | 0.5123ms | 1.9521 KOps/s | 1.9713 KOps/s | |
| test_func_call_runtime[True-compile-overhead] | 0.6751ms | 0.5069ms | 1.9726 KOps/s | 1.9739 KOps/s | |
| test_func_call_cm_runtime[False-eager] | 0.9471ms | 0.5352ms | 1.8686 KOps/s | 1.8824 KOps/s | |
| test_func_call_cm_runtime[False-compile] | 0.5870ms | 0.4958ms | 2.0171 KOps/s | 2.0045 KOps/s | |
| test_func_call_cm_runtime[False-compile-overhead] | 0.9380ms | 0.4953ms | 2.0191 KOps/s | 2.0064 KOps/s | |
| test_func_call_cm_runtime[True-eager] | 1.0336ms | 0.8767ms | 1.1406 KOps/s | 1.1179 KOps/s | |
| test_func_call_cm_runtime[True-compile] | 0.8547ms | 0.7392ms | 1.3529 KOps/s | 1.3360 KOps/s | |
| test_func_call_cm_runtime[True-compile-overhead] | 1.4661ms | 0.7460ms | 1.3405 KOps/s | 1.3254 KOps/s | |
| test_vmap_func_call_cm_runtime[eager] | 2.6362ms | 1.9078ms | 524.1749 Ops/s | 527.0870 Ops/s | |
| test_vmap_func_call_cm_runtime[compile] | 2.6314ms | 1.9402ms | 515.4225 Ops/s | 517.9405 Ops/s | |
| test_vmap_func_call_cm_runtime[compile-overhead] | 2.5640ms | 1.9464ms | 513.7808 Ops/s | 512.2776 Ops/s | |
| test_distributed | 0.3460ms | 0.1246ms | 8.0274 KOps/s | 7.8765 KOps/s | |
| test_tdmodule | 87.5440μs | 18.8261μs | 53.1178 KOps/s | 54.7892 KOps/s | |
| test_tdmodule_dispatch | 69.4700μs | 38.5186μs | 25.9615 KOps/s | 27.1672 KOps/s | |
| test_tdseq | 47.0380μs | 21.4786μs | 46.5579 KOps/s | 47.5234 KOps/s | |
| test_tdseq_dispatch | 68.6480μs | 43.5622μs | 22.9557 KOps/s | 23.8964 KOps/s | |
| test_instantiation_functorch | 2.5858ms | 1.5761ms | 634.4782 Ops/s | 633.0916 Ops/s | |
| test_instantiation_td | 1.9630ms | 1.1588ms | 862.9654 Ops/s | 840.4175 Ops/s | |
| test_exec_functorch | 0.3740ms | 0.1850ms | 5.4041 KOps/s | 5.4588 KOps/s | |
| test_exec_functional_call | 0.2695ms | 0.1714ms | 5.8355 KOps/s | 5.7353 KOps/s | |
| test_exec_td | 0.2889ms | 0.1939ms | 5.1578 KOps/s | 5.0822 KOps/s | |
| test_exec_td_decorator | 1.1015ms | 0.2278ms | 4.3896 KOps/s | 4.2734 KOps/s | |
| test_vmap_mlp_speed[True-True] | 0.9682ms | 0.6930ms | 1.4429 KOps/s | 1.4644 KOps/s | |
| test_vmap_mlp_speed[True-False] | 1.7824ms | 0.6897ms | 1.4498 KOps/s | 1.4774 KOps/s | |
| test_vmap_mlp_speed[False-True] | 0.8393ms | 0.5374ms | 1.8607 KOps/s | 1.8778 KOps/s | |
| test_vmap_mlp_speed[False-False] | 0.8484ms | 0.5397ms | 1.8530 KOps/s | 1.8314 KOps/s | |
| test_vmap_mlp_speed_decorator[True-True] | 1.4495ms | 0.6526ms | 1.5323 KOps/s | 1.5671 KOps/s | |
| test_vmap_mlp_speed_decorator[True-False] | 1.0024ms | 0.6496ms | 1.5394 KOps/s | 1.5642 KOps/s | |
| test_vmap_mlp_speed_decorator[False-True] | 0.7731ms | 0.5430ms | 1.8417 KOps/s | 1.8775 KOps/s | |
| test_vmap_mlp_speed_decorator[False-False] | 0.8066ms | 0.5352ms | 1.8685 KOps/s | 1.8760 KOps/s | |
| test_to_module_speed[True] | 2.2614ms | 1.3870ms | 720.9933 Ops/s | 711.8564 Ops/s | |
| test_to_module_speed[False] | 1.9719ms | 1.3395ms | 746.5603 Ops/s | 733.5302 Ops/s | |
| test_tc_init | 0.1316ms | 48.6917μs | 20.5374 KOps/s | 21.6872 KOps/s | |
| test_tc_init_nested | 0.1873ms | 98.3450μs | 10.1683 KOps/s | 10.6785 KOps/s | |
| test_tc_first_layer_tensor | 25.6180μs | 1.5403μs | 649.2220 KOps/s | 638.9640 KOps/s | |
| test_tc_first_layer_nontensor | 37.9410μs | 4.6426μs | 215.3955 KOps/s | 208.6821 KOps/s | |
| test_tc_second_layer_tensor | 0.5229ms | 2.9605μs | 337.7789 KOps/s | 353.6514 KOps/s | |
| test_tc_second_layer_nontensor | 71.6160μs | 6.1230μs | 163.3193 KOps/s | 162.8136 KOps/s | |
| test_unbind | 0.4917s | 13.5060ms | 74.0413 Ops/s | 133.9990 Ops/s | |
| test_full_like | 12.7031ms | 8.9402ms | 111.8546 Ops/s | 134.7268 Ops/s | |
| test_zeros_like | 4.2426ms | 3.2425ms | 308.4059 Ops/s | 328.3290 Ops/s | |
| test_ones_like | 3.8321ms | 3.4734ms | 287.9057 Ops/s | 268.1910 Ops/s | |
| test_clone | 7.6593ms | 5.9029ms | 169.4069 Ops/s | 181.1152 Ops/s | |
| test_squeeze | 66.0330μs | 12.6548μs | 79.0212 KOps/s | 79.6803 KOps/s | |
| test_unsqueeze | 0.1682ms | 91.1345μs | 10.9728 KOps/s | 11.0485 KOps/s | |
| test_split | 0.5718ms | 0.1966ms | 5.0875 KOps/s | 5.1062 KOps/s | |
| test_permute | 0.5429ms | 0.2258ms | 4.4290 KOps/s | 4.4288 KOps/s | |
| test_stack | 29.2303ms | 26.7898ms | 37.3277 Ops/s | 39.8136 Ops/s | |
| test_cat | 31.6836ms | 27.2400ms | 36.7107 Ops/s | 39.9799 Ops/s |
| Name | Max | Mean | Ops | Ops on Repo HEAD | Change |
|---|---|---|---|---|---|
| test_plain_set_nested | 34.4920μs | 16.3758μs | 61.0656 KOps/s | 58.2013 KOps/s | |
| test_plain_set_stack_nested | 42.1420μs | 16.3616μs | 61.1186 KOps/s | 57.1372 KOps/s | |
| test_plain_set_nested_inplace | 52.6520μs | 17.8211μs | 56.1133 KOps/s | 53.4395 KOps/s | |
| test_plain_set_stack_nested_inplace | 48.9120μs | 17.4865μs | 57.1868 KOps/s | 53.9906 KOps/s | |
| test_items | 28.5920μs | 2.9183μs | 342.6688 KOps/s | 344.6451 KOps/s | |
| test_items_nested | 0.3948ms | 0.3350ms | 2.9848 KOps/s | 2.9699 KOps/s | |
| test_items_nested_locked | 0.5081ms | 0.3368ms | 2.9695 KOps/s | 3.0009 KOps/s | |
| test_items_nested_leaf | 95.0040μs | 62.3608μs | 16.0357 KOps/s | 16.0325 KOps/s | |
| test_items_stack_nested | 0.3809ms | 0.3391ms | 2.9489 KOps/s | 3.0091 KOps/s | |
| test_items_stack_nested_leaf | 96.5050μs | 64.1688μs | 15.5839 KOps/s | 15.9287 KOps/s | |
| test_items_stack_nested_locked | 0.4140ms | 0.3410ms | 2.9325 KOps/s | 2.9993 KOps/s | |
| test_keys | 29.1710μs | 3.4273μs | 291.7776 KOps/s | 290.1280 KOps/s | |
| test_keys_nested | 0.1036ms | 71.0079μs | 14.0829 KOps/s | 14.1379 KOps/s | |
| test_keys_nested_locked | 2.6788ms | 77.2163μs | 12.9506 KOps/s | 12.9241 KOps/s | |
| test_keys_nested_leaf | 0.1022ms | 62.5689μs | 15.9824 KOps/s | 16.1089 KOps/s | |
| test_keys_stack_nested | 0.1368ms | 72.2487μs | 13.8411 KOps/s | 14.0141 KOps/s | |
| test_keys_stack_nested_leaf | 0.1035ms | 63.6495μs | 15.7110 KOps/s | 16.0048 KOps/s | |
| test_keys_stack_nested_locked | 0.1112ms | 77.8847μs | 12.8395 KOps/s | 13.0026 KOps/s | |
| test_values | 5.9487μs | 0.8385μs | 1.1925 MOps/s | 1.1794 MOps/s | |
| test_values_nested | 88.0140μs | 48.3738μs | 20.6724 KOps/s | 20.6487 KOps/s | |
| test_values_nested_locked | 84.9640μs | 49.9276μs | 20.0290 KOps/s | 20.1144 KOps/s | |
| test_values_nested_leaf | 74.2840μs | 42.2605μs | 23.6628 KOps/s | 23.5968 KOps/s | |
| test_values_stack_nested | 81.4930μs | 49.3610μs | 20.2589 KOps/s | 20.5379 KOps/s | |
| test_values_stack_nested_leaf | 79.3840μs | 43.4573μs | 23.0111 KOps/s | 23.2968 KOps/s | |
| test_values_stack_nested_locked | 0.1110ms | 51.2285μs | 19.5204 KOps/s | 19.7016 KOps/s | |
| test_membership | 1.8226μs | 0.5019μs | 1.9924 MOps/s | 1.9945 MOps/s | |
| test_membership_nested | 17.4960μs | 1.8980μs | 526.8648 KOps/s | 528.8577 KOps/s | |
| test_membership_nested_leaf | 10.6607μs | 1.8697μs | 534.8485 KOps/s | 527.2079 KOps/s | |
| test_membership_stacked_nested | 36.2710μs | 1.9732μs | 506.7961 KOps/s | 502.2962 KOps/s | |
| test_membership_stacked_nested_leaf | 29.6910μs | 1.9670μs | 508.3927 KOps/s | 507.4030 KOps/s | |
| test_membership_nested_last | 37.5220μs | 3.0170μs | 331.4518 KOps/s | 331.1635 KOps/s | |
| test_membership_nested_leaf_last | 37.6120μs | 3.0135μs | 331.8387 KOps/s | 324.4984 KOps/s | |
| test_membership_stacked_nested_last | 30.4010μs | 3.0566μs | 327.1636 KOps/s | 322.6258 KOps/s | |
| test_membership_stacked_nested_leaf_last | 38.5320μs | 3.0254μs | 330.5352 KOps/s | 325.7739 KOps/s | |
| test_nested_getleaf | 39.1520μs | 5.9964μs | 166.7654 KOps/s | 164.2596 KOps/s | |
| test_nested_get | 33.7820μs | 5.7276μs | 174.5942 KOps/s | 173.0692 KOps/s | |
| test_stacked_getleaf | 39.5220μs | 6.0514μs | 165.2498 KOps/s | 165.3245 KOps/s | |
| test_stacked_get | 64.2530μs | 5.6551μs | 176.8320 KOps/s | 175.7022 KOps/s | |
| test_nested_getitemleaf | 29.6720μs | 6.1326μs | 163.0623 KOps/s | 160.9446 KOps/s | |
| test_nested_getitem | 37.8820μs | 5.8109μs | 172.0910 KOps/s | 172.8984 KOps/s | |
| test_stacked_getitemleaf | 34.4210μs | 6.1126μs | 163.5976 KOps/s | 164.0680 KOps/s | |
| test_stacked_getitem | 50.4420μs | 5.6855μs | 175.8869 KOps/s | 174.5596 KOps/s | |
| test_lock_nested | 7.0316ms | 0.4327ms | 2.3112 KOps/s | 2.3039 KOps/s | |
| test_lock_stack_nested | 0.4722ms | 0.3908ms | 2.5588 KOps/s | 2.5053 KOps/s | |
| test_unlock_nested | 0.7708ms | 0.3629ms | 2.7554 KOps/s | 2.7227 KOps/s | |
| test_unlock_stack_nested | 0.3787ms | 0.3277ms | 3.0514 KOps/s | 2.9685 KOps/s | |
| test_flatten_speed | 0.1554ms | 75.8846μs | 13.1779 KOps/s | 13.1218 KOps/s | |
| test_unflatten_speed | 0.3842ms | 0.3188ms | 3.1366 KOps/s | 3.0579 KOps/s | |
| test_common_ops | 1.5243ms | 1.2268ms | 815.1286 Ops/s | 768.4649 Ops/s | |
| test_creation | 25.5710μs | 1.4790μs | 676.1146 KOps/s | 674.7252 KOps/s | |
| test_creation_empty | 91.8540μs | 14.7534μs | 67.7811 KOps/s | 59.8238 KOps/s | |
| test_creation_nested_1 | 50.2820μs | 16.4534μs | 60.7778 KOps/s | 54.5568 KOps/s | |
| test_creation_nested_2 | 53.0520μs | 19.0149μs | 52.5903 KOps/s | 47.4516 KOps/s | |
| test_clone | 0.1154ms | 28.7423μs | 34.7919 KOps/s | 35.0529 KOps/s | |
| test_getitem[int] | 1.3410ms | 16.3094μs | 61.3143 KOps/s | 62.5763 KOps/s | |
| test_getitem[slice_int] | 0.1245ms | 27.7525μs | 36.0328 KOps/s | 35.4253 KOps/s | |
| test_getitem[range] | 0.2395ms | 0.1097ms | 9.1154 KOps/s | 9.0363 KOps/s | |
| test_getitem[tuple] | 0.1218ms | 23.7776μs | 42.0565 KOps/s | 40.9022 KOps/s | |
| test_getitem[list] | 0.1959ms | 97.2600μs | 10.2817 KOps/s | 9.5904 KOps/s | |
| test_setitem_dim[int] | 72.7730μs | 43.7194μs | 22.8731 KOps/s | 21.8122 KOps/s | |
| test_setitem_dim[slice_int] | 91.7440μs | 67.1691μs | 14.8878 KOps/s | 14.2671 KOps/s | |
| test_setitem_dim[range] | 0.1618ms | 0.1271ms | 7.8694 KOps/s | 7.4761 KOps/s | |
| test_setitem_dim[tuple] | 92.2540μs | 60.5467μs | 16.5162 KOps/s | 15.7874 KOps/s | |
| test_setitem | 80.1840μs | 40.3615μs | 24.7761 KOps/s | 23.4353 KOps/s | |
| test_set | 86.6440μs | 39.7336μs | 25.1676 KOps/s | 24.3835 KOps/s | |
| test_set_shared | 0.3758ms | 53.4165μs | 18.7208 KOps/s | 18.6145 KOps/s | |
| test_update | 88.3740μs | 49.2296μs | 20.3130 KOps/s | 19.4850 KOps/s | |
| test_update_nested | 96.7740μs | 57.4292μs | 17.4127 KOps/s | 17.0316 KOps/s | |
| test_update__nested | 0.2149ms | 60.8410μs | 16.4363 KOps/s | 16.3073 KOps/s | |
| test_set_nested | 83.2240μs | 43.2639μs | 23.1140 KOps/s | 22.6179 KOps/s | |
| test_set_nested_new | 85.3240μs | 46.7683μs | 21.3820 KOps/s | 20.6985 KOps/s | |
| test_select | 0.1044ms | 59.5940μs | 16.7802 KOps/s | 16.5172 KOps/s | |
| test_select_nested | 81.2840μs | 41.9175μs | 23.8564 KOps/s | 24.1357 KOps/s | |
| test_exclude_nested | 87.8640μs | 59.1846μs | 16.8963 KOps/s | 17.0999 KOps/s | |
| test_empty[True] | 0.8788ms | 0.2629ms | 3.8044 KOps/s | 3.8335 KOps/s | |
| test_empty[False] | 3.4472μs | 0.7404μs | 1.3505 MOps/s | 1.3499 MOps/s | |
| test_to | 47.8720μs | 26.6757μs | 37.4873 KOps/s | 37.7080 KOps/s | |
| test_to_nonblocking | 59.0830μs | 24.2448μs | 41.2459 KOps/s | 38.7367 KOps/s | |
| test_unbind_speed | 0.9806ms | 0.2753ms | 3.6321 KOps/s | 3.5070 KOps/s | |
| test_unbind_speed_stack0 | 0.3319ms | 0.2770ms | 3.6107 KOps/s | 3.4997 KOps/s | |
| test_unbind_speed_stack1 | 91.7151ms | 0.7050ms | 1.4184 KOps/s | 1.3853 KOps/s | |
| test_split | 93.0734ms | 2.2094ms | 452.6184 Ops/s | 452.8856 Ops/s | |
| test_chunk | 95.0431ms | 2.1937ms | 455.8590 Ops/s | 451.7621 Ops/s | |
| test_creation[device0] | 0.3779ms | 0.1268ms | 7.8873 KOps/s | 7.7713 KOps/s | |
| test_creation_from_tensor | 0.4521ms | 0.1287ms | 7.7720 KOps/s | 7.6904 KOps/s | |
| test_add_one[memmap_tensor0] | 0.1453ms | 8.5791μs | 116.5624 KOps/s | 114.1336 KOps/s | |
| test_contiguous[memmap_tensor0] | 38.3520μs | 2.1857μs | 457.5144 KOps/s | 452.7050 KOps/s | |
| test_stack[memmap_tensor0] | 30.8510μs | 6.7825μs | 147.4378 KOps/s | 144.8199 KOps/s | |
| test_memmaptd_index | 1.0836ms | 0.4204ms | 2.3787 KOps/s | 2.2931 KOps/s | |
| test_memmaptd_index_astensor | 0.7841ms | 0.4897ms | 2.0422 KOps/s | 1.9785 KOps/s | |
| test_memmaptd_index_op | 1.3820ms | 1.0022ms | 997.7696 Ops/s | 933.1523 Ops/s | |
| test_serialize_model | 0.1332s | 0.1303s | 7.6752 Ops/s | 7.6966 Ops/s | |
| test_serialize_model_pickle | 1.3476s | 1.2125s | 0.8248 Ops/s | 0.8242 Ops/s | |
| test_serialize_weights | 0.1296s | 0.1286s | 7.7788 Ops/s | 7.7457 Ops/s | |
| test_serialize_weights_returnearly | 0.2326s | 62.0340ms | 16.1202 Ops/s | 18.0388 Ops/s | |
| test_serialize_weights_pickle | 1.3773s | 1.2167s | 0.8219 Ops/s | 0.8217 Ops/s | |
| test_reshape_pytree | 81.5940μs | 36.2021μs | 27.6227 KOps/s | 27.7625 KOps/s | |
| test_reshape_td | 77.9340μs | 43.0845μs | 23.2102 KOps/s | 22.8708 KOps/s | |
| test_view_pytree | 70.0930μs | 36.1519μs | 27.6611 KOps/s | 28.0643 KOps/s | |
| test_view_td | 87.2840μs | 48.3202μs | 20.6953 KOps/s | 21.4369 KOps/s | |
| test_unbind_pytree | 62.4830μs | 34.6063μs | 28.8965 KOps/s | 29.0877 KOps/s | |
| test_unbind_td | 0.5180ms | 42.4501μs | 23.5571 KOps/s | 22.9592 KOps/s | |
| test_split_pytree | 83.8240μs | 44.8497μs | 22.2967 KOps/s | 21.0458 KOps/s | |
| test_split_td | 0.6009ms | 56.6801μs | 17.6429 KOps/s | 14.6642 KOps/s | |
| test_add_pytree | 88.3240μs | 55.6824μs | 17.9590 KOps/s | 17.3786 KOps/s | |
| test_add_td | 0.1449ms | 99.6833μs | 10.0318 KOps/s | 10.3191 KOps/s | |
| test_compile_add_one_nested[tensordict-compile] | 0.2679ms | 0.1610ms | 6.2126 KOps/s | 6.1211 KOps/s | |
| test_compile_add_one_nested[tensordict-eager] | 0.2646ms | 0.1649ms | 6.0633 KOps/s | 6.0038 KOps/s | |
| test_compile_add_one_nested[pytree-compile] | 0.1851ms | 0.1444ms | 6.9255 KOps/s | 6.8974 KOps/s | |
| test_compile_add_one_nested[pytree-eager] | 0.2432ms | 0.1818ms | 5.5016 KOps/s | 5.4446 KOps/s | |
| test_compile_copy_nested[tensordict-compile] | 57.1430μs | 20.8154μs | 48.0414 KOps/s | 47.1995 KOps/s | |
| test_compile_copy_nested[tensordict-eager] | 82.6440μs | 48.6710μs | 20.5461 KOps/s | 19.9049 KOps/s | |
| test_compile_copy_nested[pytree-compile] | 0.2130ms | 64.1752μs | 15.5823 KOps/s | 15.5722 KOps/s | |
| test_compile_copy_nested[pytree-eager] | 84.1440μs | 49.9529μs | 20.0189 KOps/s | 20.2724 KOps/s | |
| test_compile_add_one_flat[tensordict-compile] | 0.6989ms | 0.3187ms | 3.1381 KOps/s | 3.0875 KOps/s | |
| test_compile_add_one_flat[tensordict-eager] | 0.6490ms | 0.2403ms | 4.1612 KOps/s | 4.3234 KOps/s | |
| test_compile_add_one_flat[tensorclass-compile] | 0.5197ms | 0.1269ms | 7.8823 KOps/s | 7.8116 KOps/s | |
| test_compile_add_one_flat[tensorclass-eager] | 0.1236ms | 66.4313μs | 15.0531 KOps/s | 15.3141 KOps/s | |
| test_compile_add_one_flat[pytree-compile] | 0.7370ms | 0.3192ms | 3.1325 KOps/s | 3.1287 KOps/s | |
| test_compile_add_one_flat[pytree-eager] | 1.0219ms | 0.6075ms | 1.6462 KOps/s | 1.5916 KOps/s | |
| test_compile_add_self_flat[tensordict-eager] | 0.6895ms | 0.2886ms | 3.4652 KOps/s | 3.5470 KOps/s | |
| test_compile_add_self_flat[tensordict-compile] | 0.4098ms | 0.3203ms | 3.1218 KOps/s | 3.0368 KOps/s | |
| test_compile_add_self_flat[tensorclass-eager] | 0.1365ms | 79.7706μs | 12.5360 KOps/s | 12.8881 KOps/s | |
| test_compile_add_self_flat[tensorclass-compile] | 0.1966ms | 0.1272ms | 7.8632 KOps/s | 7.6616 KOps/s | |
| test_compile_add_self_flat[pytree-eager] | 0.6461ms | 0.5202ms | 1.9225 KOps/s | 1.8973 KOps/s | |
| test_compile_add_self_flat[pytree-compile] | 0.3663ms | 0.3168ms | 3.1563 KOps/s | 3.1095 KOps/s | |
| test_compile_copy_flat[tensordict-compile] | 0.1017ms | 18.6941μs | 53.4927 KOps/s | 49.8995 KOps/s | |
| test_compile_copy_flat[tensordict-eager] | 0.4235ms | 38.1648μs | 26.2021 KOps/s | 23.9730 KOps/s | |
| test_compile_copy_flat[pytree-compile] | 0.4607ms | 68.9482μs | 14.5036 KOps/s | 14.4921 KOps/s | |
| test_compile_copy_flat[pytree-eager] | 0.4364ms | 51.6364μs | 19.3662 KOps/s | 19.5953 KOps/s | |
| test_compile_assign_and_add[tensordict-compile] | 2.3551ms | 0.8201ms | 1.2194 KOps/s | 1.1024 KOps/s | |
| test_compile_assign_and_add[tensordict-eager] | 3.3692ms | 3.1224ms | 320.2688 Ops/s | 311.8832 Ops/s | |
| test_compile_assign_and_add[pytree-compile] | 2.2988ms | 0.8089ms | 1.2362 KOps/s | 1.1123 KOps/s | |
| test_compile_assign_and_add[pytree-eager] | 3.3726ms | 3.1403ms | 318.4421 Ops/s | 313.1263 Ops/s | |
| test_compile_indexing[tensor-tensordict-compile] | 0.1523ms | 0.1080ms | 9.2632 KOps/s | 9.2701 KOps/s | |
| test_compile_indexing[tensor-tensordict-eager] | 0.1819ms | 60.9805μs | 16.3987 KOps/s | 16.5585 KOps/s | |
| test_compile_indexing[tensor-tensorclass-compile] | 0.1562ms | 0.1075ms | 9.3046 KOps/s | 9.6316 KOps/s | |
| test_compile_indexing[tensor-tensorclass-eager] | 0.1756ms | 46.6720μs | 21.4261 KOps/s | 22.9255 KOps/s | |
| test_compile_indexing[tensor-pytree-compile] | 0.1588ms | 0.1080ms | 9.2612 KOps/s | 9.5232 KOps/s | |
| test_compile_indexing[tensor-pytree-eager] | 0.1048ms | 43.7677μs | 22.8479 KOps/s | 22.7801 KOps/s | |
| test_compile_indexing[slice-tensordict-compile] | 0.1753ms | 0.1362ms | 7.3434 KOps/s | 7.2832 KOps/s | |
| test_compile_indexing[slice-tensordict-eager] | 0.1511ms | 24.7278μs | 40.4402 KOps/s | 39.4353 KOps/s | |
| test_compile_indexing[slice-tensorclass-compile] | 0.1773ms | 0.1307ms | 7.6498 KOps/s | 7.6396 KOps/s | |
| test_compile_indexing[slice-tensorclass-eager] | 52.3220μs | 21.2469μs | 47.0656 KOps/s | 47.1784 KOps/s | |
| test_compile_indexing[slice-pytree-compile] | 0.1901ms | 0.1314ms | 7.6098 KOps/s | 7.5287 KOps/s | |
| test_compile_indexing[slice-pytree-eager] | 53.9630μs | 20.2874μs | 49.2916 KOps/s | 47.0535 KOps/s | |
| test_compile_indexing[int-tensordict-compile] | 0.1954ms | 0.1373ms | 7.2831 KOps/s | 7.2271 KOps/s | |
| test_compile_indexing[int-tensordict-eager] | 0.5114ms | 25.3344μs | 39.4721 KOps/s | 39.1663 KOps/s | |
| test_compile_indexing[int-tensorclass-compile] | 0.1737ms | 0.1312ms | 7.6233 KOps/s | 7.5507 KOps/s | |
| test_compile_indexing[int-tensorclass-eager] | 0.1008ms | 28.8141μs | 34.7052 KOps/s | 47.5699 KOps/s | |
| test_compile_indexing[int-pytree-compile] | 0.2240ms | 0.1317ms | 7.5950 KOps/s | 7.5488 KOps/s | |
| test_compile_indexing[int-pytree-eager] | 57.7620μs | 20.3034μs | 49.2527 KOps/s | 47.1205 KOps/s | |
| test_mod_add[eager] | 84.2240μs | 31.2291μs | 32.0214 KOps/s | 28.9555 KOps/s | |
| test_mod_add[compile] | 0.1266ms | 70.7762μs | 14.1290 KOps/s | 14.2642 KOps/s | |
| test_mod_add[compile-overhead] | 0.2579ms | 0.1348ms | 7.4164 KOps/s | 7.0788 KOps/s | |
| test_mod_wrap[eager] | 0.8645ms | 0.7755ms | 1.2895 KOps/s | 1.2586 KOps/s | |
| test_mod_wrap[compile] | 2.0871ms | 0.8288ms | 1.2066 KOps/s | 1.1922 KOps/s | |
| test_mod_wrap[compile-overhead] | 4.9069ms | 3.0911ms | 323.5066 Ops/s | 323.4257 Ops/s | |
| test_mod_wrap_and_backward[eager] | 4.1610ms | 4.0528ms | 246.7425 Ops/s | 236.8333 Ops/s | |
| test_mod_wrap_and_backward[compile] | 4.4963ms | 3.9932ms | 250.4234 Ops/s | 239.1502 Ops/s | |
| test_mod_wrap_and_backward[compile-overhead] | 1.3187ms | 0.9007ms | 1.1103 KOps/s | 975.9782 Ops/s | |
| test_seq_add[eager] | 0.4832ms | 95.7321μs | 10.4458 KOps/s | 10.0374 KOps/s | |
| test_seq_add[compile] | 0.1325ms | 81.1587μs | 12.3215 KOps/s | 12.2030 KOps/s | |
| test_seq_add[compile-overhead] | 0.1662ms | 0.1137ms | 8.7981 KOps/s | 8.6668 KOps/s | |
| test_seq_wrap[eager] | 1.3205ms | 0.9259ms | 1.0800 KOps/s | 1.0520 KOps/s | |
| test_seq_wrap[compile] | 1.2398ms | 0.8425ms | 1.1870 KOps/s | 1.1638 KOps/s | |
| test_seq_wrap[compile-overhead] | 0.2768ms | 0.2197ms | 4.5517 KOps/s | 4.5003 KOps/s | |
| test_func_call_runtime[False-eager] | 2.7697ms | 2.3559ms | 424.4629 Ops/s | 413.0988 Ops/s | |
| test_func_call_runtime[False-compile] | 2.4459ms | 2.3594ms | 423.8340 Ops/s | 413.6143 Ops/s | |
| test_func_call_runtime[False-compile-overhead] | 0.4001ms | 0.3569ms | 2.8016 KOps/s | 2.7681 KOps/s | |
| test_func_call_runtime[True-eager] | 2.5996ms | 2.5301ms | 395.2417 Ops/s | 384.5411 Ops/s | |
| test_func_call_runtime[True-compile] | 2.4810ms | 2.4057ms | 415.6715 Ops/s | 408.2014 Ops/s | |
| test_func_call_runtime[True-compile-overhead] | 0.4259ms | 0.3762ms | 2.6578 KOps/s | 2.6001 KOps/s | |
| test_func_call_cm_runtime[False-eager] | 2.4304ms | 2.3602ms | 423.6964 Ops/s | 412.2232 Ops/s | |
| test_func_call_cm_runtime[False-compile] | 2.4590ms | 2.3897ms | 418.4665 Ops/s | 412.2039 Ops/s | |
| test_func_call_cm_runtime[False-compile-overhead] | 0.4367ms | 0.3593ms | 2.7833 KOps/s | 2.7471 KOps/s | |
| test_func_call_cm_runtime[True-eager] | 2.7034ms | 2.6312ms | 380.0606 Ops/s | 371.0252 Ops/s | |
| test_func_call_cm_runtime[True-compile] | 2.5060ms | 2.4355ms | 410.5979 Ops/s | 404.8622 Ops/s | |
| test_func_call_cm_runtime[True-compile-overhead] | 0.4865ms | 0.4048ms | 2.4701 KOps/s | 2.4333 KOps/s | |
| test_vmap_func_call_cm_runtime[eager] | 4.2002ms | 3.7574ms | 266.1418 Ops/s | 260.4512 Ops/s | |
| test_vmap_func_call_cm_runtime[compile] | 2.5837ms | 2.4596ms | 406.5667 Ops/s | 398.9787 Ops/s | |
| test_vmap_func_call_cm_runtime[compile-overhead] | 0.5135ms | 0.4058ms | 2.4641 KOps/s | 2.4316 KOps/s | |
| test_distributed | 4.0271ms | 0.2187ms | 4.5729 KOps/s | 8.4989 KOps/s | |
| test_tdmodule | 91.8440μs | 15.3296μs | 65.2331 KOps/s | 63.3729 KOps/s | |
| test_tdmodule_dispatch | 49.5930μs | 29.6402μs | 33.7380 KOps/s | 32.5702 KOps/s | |
| test_tdseq | 45.1420μs | 15.8661μs | 63.0274 KOps/s | 59.3014 KOps/s | |
| test_tdseq_dispatch | 44.1120μs | 31.1807μs | 32.0711 KOps/s | 29.5634 KOps/s | |
| test_instantiation_functorch | 2.0316ms | 1.8615ms | 537.2049 Ops/s | 537.6537 Ops/s | |
| test_instantiation_td | 1.8144ms | 1.2018ms | 832.0595 Ops/s | 832.3529 Ops/s | |
| test_exec_functorch | 1.0759ms | 0.9917ms | 1.0084 KOps/s | 981.5476 Ops/s | |
| test_exec_functional_call | 1.0629ms | 0.9913ms | 1.0088 KOps/s | 979.0682 Ops/s | |
| test_exec_td | 1.1017ms | 1.0192ms | 981.1907 Ops/s | 951.7994 Ops/s | |
| test_exec_td_decorator | 1.6075ms | 1.0453ms | 956.6372 Ops/s | 923.7262 Ops/s | |
| test_vmap_mlp_speed[True-True] | 1.3196ms | 1.2575ms | 795.2005 Ops/s | 780.3212 Ops/s | |
| test_vmap_mlp_speed[True-False] | 1.3881ms | 1.2550ms | 796.8014 Ops/s | 784.3898 Ops/s | |
| test_vmap_mlp_speed[False-True] | 1.2449ms | 1.1483ms | 870.8893 Ops/s | 860.9543 Ops/s | |
| test_vmap_mlp_speed[False-False] | 1.2418ms | 1.1488ms | 870.4632 Ops/s | 861.8601 Ops/s | |
| test_vmap_mlp_speed_decorator[True-True] | 1.9839ms | 1.2307ms | 812.5206 Ops/s | 799.3766 Ops/s | |
| test_vmap_mlp_speed_decorator[True-False] | 1.3558ms | 1.2316ms | 811.9595 Ops/s | 800.4062 Ops/s | |
| test_vmap_mlp_speed_decorator[False-True] | 1.2821ms | 1.1505ms | 869.1907 Ops/s | 860.7776 Ops/s | |
| test_vmap_mlp_speed_decorator[False-False] | 1.3372ms | 1.1514ms | 868.5049 Ops/s | 856.4258 Ops/s | |
| test_vmap_transformer_speed[True-True] | 13.1433ms | 13.0455ms | 76.6550 Ops/s | 75.5497 Ops/s | |
| test_vmap_transformer_speed[True-False] | 13.0746ms | 12.9873ms | 76.9985 Ops/s | 75.2467 Ops/s | |
| test_vmap_transformer_speed[False-True] | 12.8704ms | 12.7987ms | 78.1327 Ops/s | 76.6216 Ops/s | |
| test_vmap_transformer_speed[False-False] | 12.8975ms | 12.8279ms | 77.9552 Ops/s | 76.4692 Ops/s | |
| test_vmap_transformer_speed_decorator[True-True] | 33.6199ms | 33.4858ms | 29.8634 Ops/s | 29.5411 Ops/s | |
| test_vmap_transformer_speed_decorator[True-False] | 33.6447ms | 33.5319ms | 29.8223 Ops/s | 29.5063 Ops/s | |
| test_vmap_transformer_speed_decorator[False-True] | 34.2442ms | 33.3924ms | 29.9469 Ops/s | 29.5543 Ops/s | |
| test_vmap_transformer_speed_decorator[False-False] | 33.5067ms | 33.4106ms | 29.9307 Ops/s | 29.5457 Ops/s | |
| test_to_module_speed[True] | 1.5319ms | 0.9985ms | 1.0015 KOps/s | 997.0271 Ops/s | |
| test_to_module_speed[False] | 1.3613ms | 0.9687ms | 1.0323 KOps/s | 1.0334 KOps/s | |
| test_tc_init | 0.1077ms | 32.5140μs | 30.7560 KOps/s | 27.0390 KOps/s | |
| test_tc_init_nested | 0.1098ms | 66.2193μs | 15.1013 KOps/s | 13.0194 KOps/s | |
| test_tc_first_layer_tensor | 4.4489μs | 0.6712μs | 1.4899 MOps/s | 1.4632 MOps/s | |
| test_tc_first_layer_nontensor | 30.9210μs | 2.2540μs | 443.6615 KOps/s | 436.9556 KOps/s | |
| test_tc_second_layer_tensor | 10.6737μs | 1.3835μs | 722.8204 KOps/s | 732.4709 KOps/s | |
| test_tc_second_layer_nontensor | 28.5510μs | 2.9782μs | 335.7693 KOps/s | 337.5372 KOps/s | |
| test_unbind | 0.1957s | 12.1344ms | 82.4101 Ops/s | 91.3055 Ops/s | |
| test_full_like | 0.6557ms | 0.5731ms | 1.7448 KOps/s | 1.7395 KOps/s | |
| test_zeros_like | 0.2872ms | 0.1979ms | 5.0533 KOps/s | 5.0560 KOps/s | |
| test_ones_like | 0.2341ms | 0.1978ms | 5.0566 KOps/s | 5.0571 KOps/s | |
| test_clone | 0.4528ms | 0.4138ms | 2.4169 KOps/s | 2.4161 KOps/s | |
| test_squeeze | 32.8920μs | 9.9123μs | 100.8852 KOps/s | 101.4107 KOps/s | |
| test_unsqueeze | 0.2215ms | 74.3259μs | 13.4543 KOps/s | 13.0002 KOps/s | |
| test_split | 0.3844ms | 0.1552ms | 6.4422 KOps/s | 6.1850 KOps/s | |
| test_permute | 0.2449ms | 0.1802ms | 5.5483 KOps/s | 5.5203 KOps/s | |
| test_stack | 1.2542ms | 0.8637ms | 1.1578 KOps/s | 1.1412 KOps/s | |
| test_cat | 1.2512ms | 1.2314ms | 812.0957 Ops/s | 812.0762 Ops/s |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment
Labels
CLA Signed
This label is managed by the Facebook bot. Authors need to sign the CLA before a PR can be reviewed.
Add this suggestion to a batch that can be applied as a single commit.
This suggestion is invalid because no changes were made to the code.
Suggestions cannot be applied while the pull request is closed.
Suggestions cannot be applied while viewing a subset of changes.
Only one suggestion per line can be applied in a batch.
Add this suggestion to a batch that can be applied as a single commit.
Applying suggestions on deleted lines is not supported.
You must change the existing code in this line in order to create a valid suggestion.
Outdated suggestions cannot be applied.
This suggestion has been applied or marked resolved.
Suggestions cannot be applied from pending reviews.
Suggestions cannot be applied on multi-line comments.
Suggestions cannot be applied while the pull request is queued to merge.
Suggestion cannot be applied right now. Please check back later.
Stack from ghstack (oldest at bottom):