{"ts": "2025-11-10T21:59:00Z", "run": "af78c748d8aa44afbf8c01edaace0f7f", "impl": "torch_eager", "tags": {"family": "pytorch", "backend": "eager"}, "wl": {"name": "cuda_B1_Q100_H8_E256_L4_P4", "batch_size": 1, "num_queries": 100, "num_heads": 8, "embed_dim": 256, "num_levels": 4, "num_points": 4, "spatial_shapes": [[32, 32], [16, 16], [8, 8], [4, 4]], "dtype": "float32", "device": "cuda", "seed": 0}, "env": {"torch": "2.8.0+cu128", "cuda": "12.8", "gpu": "NVIDIA L40S", "sm": "8.9", "py": "3.11.14", "plat": "Linux-6.12.53-69.119.amzn2023.x86_64-x86_64-with-glibc2.35"}, "lat_ms": {"p10": 3.269501999966451, "p50": 3.2801430000404252, "p90": 3.3024029999637605, "mean": 3.289842799995313, "iqr": 0.02382099995656972, "raw_times": [3.3185839999987365, 3.2801430000404252, 3.269501999966451, 3.278582000007191, 3.3024029999637605], "has_warnings": false, "reps": 5, "warmup": 2}, "compile_ms": 3.341974000022674, "peak_bytes": 5929472, "ok": true, "absmax": 0.0, "corr": {"ok": true, "rtol": 1e-05, "atol": 1e-05, "absmax": 0.0, "mae": 0.0, "mse": 0.0, "ref": "deformable_detr_torch"}, "err": null} {"ts": "2025-11-10T21:59:00Z", "run": "af78c748d8aa44afbf8c01edaace0f7f", "impl": "torch_eager", "tags": {"family": "pytorch", "backend": "eager"}, "wl": {"name": "cuda_B1_Q300_H8_E256_L4_P4", "batch_size": 1, "num_queries": 300, "num_heads": 8, "embed_dim": 256, "num_levels": 4, "num_points": 4, "spatial_shapes": [[32, 32], [16, 16], [8, 8], [4, 4]], "dtype": "float32", "device": "cuda", "seed": 0}, "env": {"torch": "2.8.0+cu128", "cuda": "12.8", "gpu": "NVIDIA L40S", "sm": "8.9", "py": "3.11.14", "plat": "Linux-6.12.53-69.119.amzn2023.x86_64-x86_64-with-glibc2.35"}, "lat_ms": {"p10": 3.9856040000358917, "p50": 4.010704999984682, "p90": 4.045005000023139, "mean": 4.019770599995809, "iqr": 0.05120100007616202, "raw_times": [4.045005000023139, 4.063734999988355, 4.010704999984682, 3.9856040000358917, 3.9938039999469765], "has_warnings": false, "reps": 5, "warmup": 2}, "compile_ms": 4.026463999991847, "peak_bytes": 15161856, "ok": true, "absmax": 0.0, "corr": {"ok": true, "rtol": 1e-05, "atol": 1e-05, "absmax": 0.0, "mae": 0.0, "mse": 0.0, "ref": "deformable_detr_torch"}, "err": null} {"ts": "2025-11-10T21:59:01Z", "run": "af78c748d8aa44afbf8c01edaace0f7f", "impl": "torch_eager", "tags": {"family": "pytorch", "backend": "eager"}, "wl": {"name": "cuda_B2_Q100_H8_E256_L4_P4", "batch_size": 2, "num_queries": 100, "num_heads": 8, "embed_dim": 256, "num_levels": 4, "num_points": 4, "spatial_shapes": [[32, 32], [16, 16], [8, 8], [4, 4]], "dtype": "float32", "device": "cuda", "seed": 0}, "env": {"torch": "2.8.0+cu128", "cuda": "12.8", "gpu": "NVIDIA L40S", "sm": "8.9", "py": "3.11.14", "plat": "Linux-6.12.53-69.119.amzn2023.x86_64-x86_64-with-glibc2.35"}, "lat_ms": {"p10": 4.021324000007098, "p50": 4.030125000042517, "p90": 4.037073999995755, "mean": 4.049654600009944, "iqr": 0.01115999998546613, "raw_times": [4.037073999995755, 4.021324000007098, 4.133835999994062, 4.030125000042517, 4.025914000010289], "has_warnings": false, "reps": 5, "warmup": 2}, "compile_ms": 4.049624999993284, "peak_bytes": 11958784, "ok": true, "absmax": 0.0, "corr": {"ok": true, "rtol": 1e-05, "atol": 1e-05, "absmax": 0.0, "mae": 0.0, "mse": 0.0, "ref": "deformable_detr_torch"}, "err": null} {"ts": "2025-11-10T21:59:01Z", "run": "af78c748d8aa44afbf8c01edaace0f7f", "impl": "torch_eager", "tags": {"family": "pytorch", "backend": "eager"}, "wl": {"name": "cuda_B2_Q300_H8_E256_L4_P4", "batch_size": 2, "num_queries": 300, "num_heads": 8, "embed_dim": 256, "num_levels": 4, "num_points": 4, "spatial_shapes": [[32, 32], [16, 16], [8, 8], [4, 4]], "dtype": "float32", "device": "cuda", "seed": 0}, "env": {"torch": "2.8.0+cu128", "cuda": "12.8", "gpu": "NVIDIA L40S", "sm": "8.9", "py": "3.11.14", "plat": "Linux-6.12.53-69.119.amzn2023.x86_64-x86_64-with-glibc2.35"}, "lat_ms": {"p10": 4.128727000022536, "p50": 4.140276000043741, "p90": 4.142176000016207, "mean": 4.14041620002763, "iqr": 0.006619999965096213, "raw_times": [4.155346000004556, 4.140276000043741, 4.1355560000511105, 4.128727000022536, 4.142176000016207], "has_warnings": false, "reps": 5, "warmup": 2}, "compile_ms": 4.139206999980161, "peak_bytes": 30977024, "ok": true, "absmax": 0.0, "corr": {"ok": true, "rtol": 1e-05, "atol": 1e-05, "absmax": 0.0, "mae": 0.0, "mse": 0.0, "ref": "deformable_detr_torch"}, "err": null}