% Technical report on layer-wise energy/latency prediction for CNN inference on
% single-board computers (repository export, de-duplicated).
% Cleanup applied: the author list and the abstract each appeared twice in the
% export; the abstract now lives in `abstract` so styles do not print it as a note.
% NOTE(review): `institution` is required for @techreport but the export does not
% provide one -- add it from the repository record.
% NOTE(review): name order is kept as exported; it looks like given/family names
% may be swapped (e.g. "Satoshi, Kawakami") -- confirm against the paper.
@techreport{oai:ipsj.ixsq.nii.ac.jp:00217101,
  author   = {Yi, Ng Kuan and Aalaa, M. A. Babai and Satoshi, Kawakami and Teruo, Tanimoto and Koji, Inoue},
  title    = {Layer-wise power/performance modelling for single-board {CNN} inference},
  number   = {13},
  month    = mar,
  year     = {2022},
  abstract = {Intermittent executions and energy harvesting technologies are promising candidates to enable renewable energy on small-scale computer systems like single-board computers, making sustainable computing possible. In this work, we implemented an energy consumption prediction framework for each layer of CNN executing on single-board computers based on NeuralPower as the first step towards enabling energy-efficient intermittent execution of CNN inference on single-board computers. We found that layer hyperparameters cannot explain all the variations in execution time and power consumption when the layer is executed. Model's prediction can be improved with the knowledge of performance counter values, but these values are not available before a layer is executed. Furthermore, our analysis revealed that implementation optimization like sparse matrix multiplication might cause a layer's execution time and power to change with its input values.},
}