|
| 1 | +Namespace(model='deit_base', dataset='dataset/imagenet/', calib_batchsize=32, val_batchsize=200, num_workers=8, device='cuda', print_freq=100, seed=0, w_bits=4, a_bits=4, log_quant_scheme='BitLog2_Single_16') |
| 2 | +Building dataloader ... |
| 3 | +Building model ... |
| 4 | +Performing initial quantization ... |
| 5 | +self.delta: 22492.0 |
| 6 | +16 tensor([-100000, 0, 10, 20, 30, 40, 50, 60, |
| 7 | + 70, 80, 90, 100, 110, 120, 130, 140], |
| 8 | + device='cuda:0', dtype=torch.int32) |
| 9 | +16 tensor([0.0000e+00, 1.0000e+00, 2.0000e+00, 4.0000e+00, 8.0000e+00, 1.6000e+01, |
| 10 | + 3.2000e+01, 6.4000e+01, 1.2800e+02, 2.5600e+02, 5.1200e+02, 1.0240e+03, |
| 11 | + 2.0480e+03, 4.0960e+03, 8.1920e+03, 1.6384e+04], device='cuda:0') |
| 12 | +16 tensor([0.0000e+00, 4.4460e-05, 8.8921e-05, 1.7784e-04, 3.5568e-04, 7.1136e-04, |
| 13 | + 1.4227e-03, 2.8455e-03, 5.6909e-03, 1.1382e-02, 2.2764e-02, 4.5527e-02, |
| 14 | + 9.1055e-02, 1.8211e-01, 3.6422e-01, 7.2844e-01], device='cuda:0') |
| 15 | +self.delta: 24500.0 |
| 16 | +16 tensor([-100000, 0, 10, 20, 30, 40, 50, 60, |
| 17 | + 70, 80, 90, 100, 110, 120, 130, 140], |
| 18 | + device='cuda:0', dtype=torch.int32) |
| 19 | +16 tensor([0.0000e+00, 1.0000e+00, 2.0000e+00, 4.0000e+00, 8.0000e+00, 1.6000e+01, |
| 20 | + 3.2000e+01, 6.4000e+01, 1.2800e+02, 2.5600e+02, 5.1200e+02, 1.0240e+03, |
| 21 | + 2.0480e+03, 4.0960e+03, 8.1920e+03, 1.6384e+04], device='cuda:0') |
| 22 | +16 tensor([0.0000e+00, 4.0816e-05, 8.1633e-05, 1.6327e-04, 3.2653e-04, 6.5306e-04, |
| 23 | + 1.3061e-03, 2.6122e-03, 5.2245e-03, 1.0449e-02, 2.0898e-02, 4.1796e-02, |
| 24 | + 8.3592e-02, 1.6718e-01, 3.3437e-01, 6.6873e-01], device='cuda:0') |
| 25 | +self.delta: 24528.0 |
| 26 | +16 tensor([-100000, 0, 10, 20, 30, 40, 50, 60, |
| 27 | + 70, 80, 90, 100, 110, 120, 130, 140], |
| 28 | + device='cuda:0', dtype=torch.int32) |
| 29 | +16 tensor([0.0000e+00, 1.0000e+00, 2.0000e+00, 4.0000e+00, 8.0000e+00, 1.6000e+01, |
| 30 | + 3.2000e+01, 6.4000e+01, 1.2800e+02, 2.5600e+02, 5.1200e+02, 1.0240e+03, |
| 31 | + 2.0480e+03, 4.0960e+03, 8.1920e+03, 1.6384e+04], device='cuda:0') |
| 32 | +16 tensor([0.0000e+00, 4.0770e-05, 8.1539e-05, 1.6308e-04, 3.2616e-04, 6.5232e-04, |
| 33 | + 1.3046e-03, 2.6093e-03, 5.2185e-03, 1.0437e-02, 2.0874e-02, 4.1748e-02, |
| 34 | + 8.3496e-02, 1.6699e-01, 3.3399e-01, 6.6797e-01], device='cuda:0') |
| 35 | +self.delta: 21922.0 |
| 36 | +16 tensor([-100000, 0, 10, 20, 30, 40, 50, 60, |
| 37 | + 70, 80, 90, 100, 110, 120, 130, 140], |
| 38 | + device='cuda:0', dtype=torch.int32) |
| 39 | +16 tensor([0.0000e+00, 1.0000e+00, 2.0000e+00, 4.0000e+00, 8.0000e+00, 1.6000e+01, |
| 40 | + 3.2000e+01, 6.4000e+01, 1.2800e+02, 2.5600e+02, 5.1200e+02, 1.0240e+03, |
| 41 | + 2.0480e+03, 4.0960e+03, 8.1920e+03, 1.6384e+04], device='cuda:0') |
| 42 | +16 tensor([0.0000e+00, 4.5616e-05, 9.1233e-05, 1.8247e-04, 3.6493e-04, 7.2986e-04, |
| 43 | + 1.4597e-03, 2.9194e-03, 5.8389e-03, 1.1678e-02, 2.3356e-02, 4.6711e-02, |
| 44 | + 9.3422e-02, 1.8684e-01, 3.7369e-01, 7.4738e-01], device='cuda:0') |
| 45 | +self.delta: 23644.0 |
| 46 | +16 tensor([-100000, 0, 10, 20, 30, 40, 50, 60, |
| 47 | + 70, 80, 90, 100, 110, 120, 130, 140], |
| 48 | + device='cuda:0', dtype=torch.int32) |
| 49 | +16 tensor([0.0000e+00, 1.0000e+00, 2.0000e+00, 4.0000e+00, 8.0000e+00, 1.6000e+01, |
| 50 | + 3.2000e+01, 6.4000e+01, 1.2800e+02, 2.5600e+02, 5.1200e+02, 1.0240e+03, |
| 51 | + 2.0480e+03, 4.0960e+03, 8.1920e+03, 1.6384e+04], device='cuda:0') |
| 52 | +16 tensor([0.0000e+00, 4.2294e-05, 8.4588e-05, 1.6918e-04, 3.3835e-04, 6.7670e-04, |
| 53 | + 1.3534e-03, 2.7068e-03, 5.4136e-03, 1.0827e-02, 2.1655e-02, 4.3309e-02, |
| 54 | + 8.6618e-02, 1.7324e-01, 3.4647e-01, 6.9295e-01], device='cuda:0') |
| 55 | +self.delta: 24428.0 |
| 56 | +16 tensor([-100000, 0, 10, 20, 30, 40, 50, 60, |
| 57 | + 70, 80, 90, 100, 110, 120, 130, 140], |
| 58 | + device='cuda:0', dtype=torch.int32) |
| 59 | +16 tensor([0.0000e+00, 1.0000e+00, 2.0000e+00, 4.0000e+00, 8.0000e+00, 1.6000e+01, |
| 60 | + 3.2000e+01, 6.4000e+01, 1.2800e+02, 2.5600e+02, 5.1200e+02, 1.0240e+03, |
| 61 | + 2.0480e+03, 4.0960e+03, 8.1920e+03, 1.6384e+04], device='cuda:0') |
| 62 | +16 tensor([0.0000e+00, 4.0937e-05, 8.1873e-05, 1.6375e-04, 3.2749e-04, 6.5499e-04, |
| 63 | + 1.3100e-03, 2.6199e-03, 5.2399e-03, 1.0480e-02, 2.0960e-02, 4.1919e-02, |
| 64 | + 8.3838e-02, 1.6768e-01, 3.3535e-01, 6.7071e-01], device='cuda:0') |
| 65 | +self.delta: 24110.0 |
| 66 | +16 tensor([-100000, 0, 10, 20, 30, 40, 50, 60, |
| 67 | + 70, 80, 90, 100, 110, 120, 130, 140], |
| 68 | + device='cuda:0', dtype=torch.int32) |
| 69 | +16 tensor([0.0000e+00, 1.0000e+00, 2.0000e+00, 4.0000e+00, 8.0000e+00, 1.6000e+01, |
| 70 | + 3.2000e+01, 6.4000e+01, 1.2800e+02, 2.5600e+02, 5.1200e+02, 1.0240e+03, |
| 71 | + 2.0480e+03, 4.0960e+03, 8.1920e+03, 1.6384e+04], device='cuda:0') |
| 72 | +16 tensor([0.0000e+00, 4.1477e-05, 8.2953e-05, 1.6591e-04, 3.3181e-04, 6.6363e-04, |
| 73 | + 1.3273e-03, 2.6545e-03, 5.3090e-03, 1.0618e-02, 2.1236e-02, 4.2472e-02, |
| 74 | + 8.4944e-02, 1.6989e-01, 3.3978e-01, 6.7955e-01], device='cuda:0') |
| 75 | +self.delta: 24275.0 |
| 76 | +16 tensor([-100000, 0, 10, 20, 30, 40, 50, 60, |
| 77 | + 70, 80, 90, 100, 110, 120, 130, 140], |
| 78 | + device='cuda:0', dtype=torch.int32) |
| 79 | +16 tensor([0.0000e+00, 1.0000e+00, 2.0000e+00, 4.0000e+00, 8.0000e+00, 1.6000e+01, |
| 80 | + 3.2000e+01, 6.4000e+01, 1.2800e+02, 2.5600e+02, 5.1200e+02, 1.0240e+03, |
| 81 | + 2.0480e+03, 4.0960e+03, 8.1920e+03, 1.6384e+04], device='cuda:0') |
| 82 | +16 tensor([0.0000e+00, 4.1195e-05, 8.2389e-05, 1.6478e-04, 3.2956e-04, 6.5911e-04, |
| 83 | + 1.3182e-03, 2.6365e-03, 5.2729e-03, 1.0546e-02, 2.1092e-02, 4.2183e-02, |
| 84 | + 8.4367e-02, 1.6873e-01, 3.3747e-01, 6.7493e-01], device='cuda:0') |
| 85 | +self.delta: 24151.0 |
| 86 | +16 tensor([-100000, 0, 10, 20, 30, 40, 50, 60, |
| 87 | + 70, 80, 90, 100, 110, 120, 130, 140], |
| 88 | + device='cuda:0', dtype=torch.int32) |
| 89 | +16 tensor([0.0000e+00, 1.0000e+00, 2.0000e+00, 4.0000e+00, 8.0000e+00, 1.6000e+01, |
| 90 | + 3.2000e+01, 6.4000e+01, 1.2800e+02, 2.5600e+02, 5.1200e+02, 1.0240e+03, |
| 91 | + 2.0480e+03, 4.0960e+03, 8.1920e+03, 1.6384e+04], device='cuda:0') |
| 92 | +16 tensor([0.0000e+00, 4.1406e-05, 8.2812e-05, 1.6562e-04, 3.3125e-04, 6.6250e-04, |
| 93 | + 1.3250e-03, 2.6500e-03, 5.3000e-03, 1.0600e-02, 2.1200e-02, 4.2400e-02, |
| 94 | + 8.4800e-02, 1.6960e-01, 3.3920e-01, 6.7840e-01], device='cuda:0') |
| 95 | +self.delta: 24589.0 |
| 96 | +16 tensor([-100000, 0, 10, 20, 30, 40, 50, 60, |
| 97 | + 70, 80, 90, 100, 110, 120, 130, 140], |
| 98 | + device='cuda:0', dtype=torch.int32) |
| 99 | +16 tensor([0.0000e+00, 1.0000e+00, 2.0000e+00, 4.0000e+00, 8.0000e+00, 1.6000e+01, |
| 100 | + 3.2000e+01, 6.4000e+01, 1.2800e+02, 2.5600e+02, 5.1200e+02, 1.0240e+03, |
| 101 | + 2.0480e+03, 4.0960e+03, 8.1920e+03, 1.6384e+04], device='cuda:0') |
| 102 | +16 tensor([0.0000e+00, 4.0669e-05, 8.1337e-05, 1.6267e-04, 3.2535e-04, 6.5070e-04, |
| 103 | + 1.3014e-03, 2.6028e-03, 5.2056e-03, 1.0411e-02, 2.0822e-02, 4.1645e-02, |
| 104 | + 8.3289e-02, 1.6658e-01, 3.3316e-01, 6.6631e-01], device='cuda:0') |
| 105 | +self.delta: 24586.0 |
| 106 | +16 tensor([-100000, 0, 10, 20, 30, 40, 50, 60, |
| 107 | + 70, 80, 90, 100, 110, 120, 130, 140], |
| 108 | + device='cuda:0', dtype=torch.int32) |
| 109 | +16 tensor([0.0000e+00, 1.0000e+00, 2.0000e+00, 4.0000e+00, 8.0000e+00, 1.6000e+01, |
| 110 | + 3.2000e+01, 6.4000e+01, 1.2800e+02, 2.5600e+02, 5.1200e+02, 1.0240e+03, |
| 111 | + 2.0480e+03, 4.0960e+03, 8.1920e+03, 1.6384e+04], device='cuda:0') |
| 112 | +16 tensor([0.0000e+00, 4.0674e-05, 8.1347e-05, 1.6269e-04, 3.2539e-04, 6.5078e-04, |
| 113 | + 1.3016e-03, 2.6031e-03, 5.2062e-03, 1.0412e-02, 2.0825e-02, 4.1650e-02, |
| 114 | + 8.3299e-02, 1.6660e-01, 3.3320e-01, 6.6640e-01], device='cuda:0') |
| 115 | +self.delta: 24545.0 |
| 116 | +16 tensor([-100000, 0, 10, 20, 30, 40, 50, 60, |
| 117 | + 70, 80, 90, 100, 110, 120, 130, 140], |
| 118 | + device='cuda:0', dtype=torch.int32) |
| 119 | +16 tensor([0.0000e+00, 1.0000e+00, 2.0000e+00, 4.0000e+00, 8.0000e+00, 1.6000e+01, |
| 120 | + 3.2000e+01, 6.4000e+01, 1.2800e+02, 2.5600e+02, 5.1200e+02, 1.0240e+03, |
| 121 | + 2.0480e+03, 4.0960e+03, 8.1920e+03, 1.6384e+04], device='cuda:0') |
| 122 | +16 tensor([0.0000e+00, 4.0741e-05, 8.1483e-05, 1.6297e-04, 3.2593e-04, 6.5186e-04, |
| 123 | + 1.3037e-03, 2.6075e-03, 5.2149e-03, 1.0430e-02, 2.0860e-02, 4.1719e-02, |
| 124 | + 8.3439e-02, 1.6688e-01, 3.3375e-01, 6.6751e-01], device='cuda:0') |
| 125 | +Performing scale reparameterization ... |
| 126 | +Validating ... |
| 127 | +Test: [0/250] Time 4.031 (4.031) Loss 0.5960 (0.5960) Prec@1 89.500 (89.500) Prec@5 99.000 (99.000) |
| 128 | +Test: [100/250] Time 1.841 (1.864) Loss 1.4360 (0.9697) Prec@1 68.500 (81.079) Prec@5 89.500 (95.277) |
| 129 | +Test: [200/250] Time 1.840 (1.852) Loss 0.6625 (1.1916) Prec@1 87.500 (76.239) Prec@5 98.500 (92.348) |
| 130 | + * Prec@1 75.458 Prec@5 92.044 Time 462.533 |
0 commit comments