2 IEEE TRANSACTIONS ON PATTERN ANALYSIS AND MACHINE INTELLIGENCE, VOL. 0, NO. 0, MAY 2021
of transform quantization. An $h \times w$ convolution layer (gray)
is converted to a pair of basis (blue) and transform domain
(orange) convolutional layers (a), then the pair quantized to
rate–distortion optimum bit-depths (b). In the absence of
quantization, composing the mappings of this pair of layers
recovers (or synthesizes) the original one. Signal processing
literature uses the term “transform coding” more commonly
than transform quantization. However, we adopt the latter
term in this work to stress our focus on quantization rather
than (entropy) coding, which we address in our sequel.
  Our main contributions are as follows. First, we propose
transform quantization for compressing CNN weights—we
are the first to consider quantization of transformed weights
and basis, and optimize both post-training. Second, we give
a theory of rate and distortion for CNN quantization, based
on which transform coding gains can be computed. We then
derive an end-to-end-learned transform that maximizes the
gains. Third, we advance the state of the art in compression
of CNNs, in both retrained and non-retrained scenarios, for
image classification—AlexNet [1], ResNets [60], DenseNets
[61], and for low-level vision tasks, DRUNet (denoising) [62]
and EDSR (super-resolution) [63].
2 RELATED WORK
CNN compression methods based on pruning [7–20] nullify
kernels [7–13], channels [14–17], or even individual weights
[18–20] that are insignificant according to such criteria as a
norm [7–9] or some objective function [18]. However, while
a few methods [20] compress the pruned weights further via
quantization and variable-length (Huffman) coding, optimal
quantization of pruned networks generally remains an open
problem. Moreover, the pruning criteria are often chosen in
a heuristic manner agnostic to the actual accuracy losses. By
contrast, our transform-quantization framework quantizes
to zero (i.e. prunes) kernels which are deemed insignificant
according to bit-depth–accuracy optimality criteria.
  Contemporaneous with the pruning-based techniques for
CNN compression, some researchers proposed to compress
CNNs first by spatially decorrelating their weights with the
DCT, followed by vector quantization [24] or hashing [26] of
the decorrelated weights to further reduce the redundancies
across the transformed kernels. These transform approaches
are, however, applicable to the compression of convolution
kernels only, computationally complex due to the clustering
involved [24], or cache-inefficient due to using hashtables as
the main data structure [26]. Moreover, some CNN models
contain large numbers of $1 \times 1$ convolutional kernels, where
the benefit of spatial decorrelation of kernels via the DCT is
less significant. In contrast with the spatial-transform-based
approaches, our quantization framework transforms across
(rather than within) kernels to provide the compression and
efficiency gains even for smaller convolution kernels.
  In parallel with the DCT techniques above, other authors
sought to reduce the dimensionality of CNN layers via PCA
and related techniques [47–56]. Denton et al. [47] apply the
SVD across kernels in convolution layers, or across the rows
and columns of weight matrices for fully-connecting layers
to project input or output to low-rank subspaces, providing
computational savings during the inference stage. Zhang et
al. [51] extend this method by using the generalized SVD to
take into account the presence of ReLU activations between
successive layers. This work was extended in turn by Kim et
al. [52], who apply the SVD on all four axes of convolutional
tensors. Li et al. [49] extend the work of [51] by partitioning
the kernels into subsets, then using the SVD on each subset
of kernels separately. However, PCA-based compression is
not concerned with quantization, so optimal quantization of
the projected network remains an open problem. Also, PCA
methods determine the projection dimensions heuristically
using decorrelated weight variances [51, 52], by minimizing
a least-squares criterion [50] or using dimension assignment
rules [54], none of which reflect the actual loss of prediction
accuracy due to the projections. By contrast, our framework
determines the quantization bit-depths and their associated
projection dimensions to minimize the performance loss at a
given quantization bit-rate (average bit-depth).
  Quantization methods (both vector and scalar) for CNNs
[20–46] have developed alongside pruning methods. Vector
quantization of weights [22–26] involves $k$-means [22–24] or
a “hashing trick” [25, 26] and may additionally involve the
DCT [24, 26] and residual quantization [22]. Uniform scalar
quantization of weights to one bit (binary representation) is
proposed by Hubara et al. [31, 41], and to two bits (ternary)
by Zhu et al. [30]. LQ-Nets [37] learn the optimal quantizers
during training at a specified bit-depth. Non-uniform scalar
quantization was proposed by Tung and Mori [21], whereas
Zhou et al. [36] demonstrate that we can quantize networks
post-training, provided that weights can be refined by some
additional training after quantizing (we refer to this process
as re-training). Recent methods [38, 43] propose to quantize
networks in a training-free manner, based on a per-channel
bit-depth allocation paradigm [38], or by equalizing weights
and correcting biases [43]. We extend per-channel bit-depth
allocation and re-training to the transform domain.
  Designing lightweight CNNs such as MobileNet [64] and
SqueezeNet [65] is another form of model compression. One
can relate the depthwise convolution layers of [64] to perfect
Fig. 1. Transform quantization of CNN layers. Given weight matrices $\Theta_1, \Theta_2, \dots, \Theta_L$ of an $L$-layer CNN, we represent each one as $\Theta_l = S_l T_l$ (a) and quantize both the kernel matrix $T_l$ and the basis $S_l$ optimally (b). In (b), the bar lengths illustrate the bit-depths needed to quantize $\Theta_l = S_l T_l$ in the transform domain (blue and orange bars) for the same performance. Elements corresponding to zero bit-depth assignments ($R_k = 0$) are indicated as white blocks in (a).