Layer Information

layer_index | layer_name | layer_type | layer_shape | layer_duration (us) | layer_allocated_bytes | layer_peak_allocated_bytes | layer_allocator_bytes_in_use | layer_allocator_name | layer_host_temp_mem_bytes | layer_device_temp_mem_bytes | layer_host_persistent_mem_bytes | layer_device_persistent_mem_bytes |
---|---|---|---|---|---|---|---|---|---|---|---|---|
2 | conv2d0 | _FusedConv2D | [[1 112 112 64]] | 4824.333 | 4190208 | 4190208 | 4192938.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
3 | maxpool0 | MaxPool | [[1 56 56 64]] | 728.333 | 802816 | 802816 | 4995754.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
4 | localresponsenorm0 | LRN | [[1 56 56 64]] | 449.333 | 802816 | 802816 | 1608362.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
5 | conv2d1 | _FusedConv2D | [[1 56 56 64]] | 318.667 | 802816 | 802816 | 1608362.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
6 | conv2d2 | _FusedConv2D | [[1 56 56 192]] | 4816.333 | 3391488 | 3391488 | 4197034.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
7 | localresponsenorm1 | LRN | [[1 56 56 192]] | 1891 | 4190208 | 4190208 | 7584426.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
8 | maxpool1 | MaxPool | [[1 28 28 192]] | 314.333 | 602112 | 602112 | 4795050.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
9 | mixed3a_5x5_bottleneck | _FusedConv2D | [[1 28 28 16]] | 508.333 | 50176 | 50176 | 1790976 | cuda_host_bfc | 0 | 0 | 0 | 0 |
10 | mixed3a_pool | MaxPool | [[1 28 28 192]] | 465.333 | 602112 | 602112 | 1792341.333 | cuda_host_bfc | 0 | 0 | 0 | 0 |
11 | mixed3a_1x1 | _FusedConv2D | [[1 28 28 64]] | 505.667 | 200704 | 200704 | 1859242.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
12 | mixed3a_3x3_bottleneck | _FusedConv2D | [[1 28 28 96]] | 623 | 301056 | 301056 | 1924778.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
13 | mixed3a_pool_reduce | _FusedConv2D | [[1 28 28 32]] | 322 | 100352 | 100352 | 1958229.333 | cuda_host_bfc | 0 | 0 | 0 | 0 |
14 | mixed3a_5x5 | _FusedConv2D | [[1 28 28 32]] | 650 | 100352 | 100352 | 1289216 | cuda_host_bfc | 0 | 0 | 0 | 0 |
15 | mixed3a_3x3 | _FusedConv2D | [[1 28 28 128]] | 1440.333 | 535210.667 | 535210.667 | 1239040 | cuda_host_bfc | 0 | 0 | 0 | 0 |
16 | mixed3a | Concat | [[1 28 28 256]] | 148 | 953344 | 953344 | 1941504 | cuda_host_bfc | 0 | 0 | 0 | 0 |
17 | mixed3b_pool | MaxPool | [[1 28 28 256]] | 501.667 | 802816 | 802816 | 2712234.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
18 | mixed3b_1x1 | _FusedConv2D | [[1 28 28 128]] | 1166 | 401408 | 401408 | 2996565.333 | cuda_host_bfc | 0 | 0 | 0 | 0 |
19 | mixed3b_5x5_bottleneck | _FusedConv2D | [[1 28 28 32]] | 1045.333 | 100352 | 100352 | 2829312 | cuda_host_bfc | 0 | 0 | 0 | 0 |
20 | mixed3b_pool_reduce | _FusedConv2D | [[1 28 28 64]] | 733.333 | 200704 | 200704 | 3113642.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
21 | mixed3b_3x3_bottleneck | _FusedConv2D | [[1 28 28 128]] | 1303.667 | 401408 | 401408 | 2411178.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
22 | mixed3b_5x5 | _FusedConv2D | [[1 28 28 96]] | 2523.667 | 301056 | 301056 | 2440874.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
23 | mixed3b_3x3 | _FusedConv2D | [[1 28 28 192]] | 3177.667 | 999765.333 | 999765.333 | 2340522.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
24 | mixed3b | Concat | [[1 28 28 480]] | 164.667 | 1940138.667 | 1940138.667 | 3930794.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
25 | maxpool4 | MaxPool | [[1 14 14 480]] | 186.333 | 376320 | 376320 | 2320554.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
26 | mixed4a_pool | MaxPool | [[1 14 14 480]] | 266.667 | 376320 | 376320 | 995072 | cuda_host_bfc | 0 | 0 | 0 | 0 |
27 | mixed4a_5x5_bottleneck | _FusedConv2D | [[1 14 14 16]] | 382.667 | 12544 | 12544 | 1043882.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
28 | mixed4a_3x3_bottleneck | _FusedConv2D | [[1 14 14 96]] | 528.667 | 75264 | 75264 | 1068970.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
29 | mixed4a_pool_reduce | _FusedConv2D | [[1 14 14 64]] | 425.333 | 50176 | 50176 | 1237333.333 | cuda_host_bfc | 0 | 0 | 0 | 0 |
30 | mixed4a_5x5 | _FusedConv2D | [[1 14 14 48]] | 401.667 | 37632 | 37632 | 938666.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
31 | mixed4a_1x1 | _FusedConv2D | [[1 14 14 192]] | 883 | 150528 | 150528 | 856832 | cuda_host_bfc | 0 | 0 | 0 | 0 |
32 | mixed4a_3x3 | _FusedConv2D | [[1 14 14 204]] | 769.667 | 160000 | 160000 | 476330.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
33 | mixed4a | Concat | [[1 14 14 508]] | 114.667 | 443221.333 | 443221.333 | 843264 | cuda_host_bfc | 0 | 0 | 0 | 0 |
34 | head0_pool | AvgPool | [[1 4 4 508]] | 72.667 | 32512 | 32512 | 477440 | cuda_host_bfc | 0 | 0 | 0 | 0 |
35 | head0_bottleneck | _FusedConv2D | [[1 4 4 128]] | 123.667 | 8192 | 8192 | 43434.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
36 | head0_bottleneck/reshape | Reshape | [[1 2048]] | 8.333 | 8192 | 0 | 0 | cuda_host_bfc | 0 | 0 | 0 | 0 |
37 | nn0_pre_relu/matmul | MatMul | [[1 1024]] | 746 | 4096 | 4096 | 15018.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
38 | nn0_pre_relu | BiasAdd | [[1 1024]] | 11.333 | 4096 | 0 | 0 | cuda_host_bfc | 0 | 0 | 0 | 0 |
39 | nn0 | Relu | [[1 1024]] | 6 | 4096 | 0 | 0 | cuda_host_bfc | 0 | 0 | 0 | 0 |
40 | softmax0_pre_activation/matmul | MatMul | [[1 1008]] | 389 | 4096 | 4096 | 10922.667 | cuda_host_bfc | 0 | 0 | 0 | 0 |
41 | softmax0_pre_activation | BiasAdd | [[1 1008]] | 7.333 | 4096 | 0 | 0 | cuda_host_bfc | 0 | 0 | 0 | 0 |
42 | softmax0 | Softmax | [[1 1008]] | 40 | 4096 | 0 | 0 | cuda_host_bfc | 0 | 0 | 0 | 0 |
43 | output | Identity | [[1 1008]] | 5 | 4096 | 0 | 0 | cuda_host_bfc | 0 | 0 | 0 | 0 |

Showing 1 to 42 of 42 entries