People
Research
High-Performance Computing
Energy-Efficient Computing
Energy-Efficient Communications
Applications
Publications
Education
Engineering Degree
Master's Degree
Ph.D. Degree
Projects
Academia
Industry
Publications
Home
/
Research
/
Publications
% --- YEAR 2024 ---

@article{10579818,
  author = {Alves, Alex C. R. and Silveira, Luiz F. Q. and Kreutz, Márcio E. and Dias, Samaherni M.},
  title = {A Parity-Based Dual Modular Redundancy Approach for the Reliability of Data Transmission in Nanosatellite’s Onboard Processing},
  journal = {IEEE Access},
  year = {2024},
  pages = {1--1},
  url = {https://ieeexplore.ieee.org/document/10579818}
}

@article{SANTANA2024105662,
  author = {Carla Santana and Ramon C. F. Araújo and Idalmis Milian Sardina and Ítalo A. S. {de Assis} and Tiago Barros and Calebe P. Bianchini and Antonio D. de S. Oliveira and João M. {de Araújo} and Hervé Chauris and Claude Tadonki and Samuel Xavier-de-Souza},
  title = {{DeLIA}: A Dependability Library for Iterative Applications applied to parallel geophysical problems},
  journal = {Computers \& Geosciences},
  pages = {105662},
  year = {2024},
  issn = {0098-3004},
  doi = {10.1016/j.cageo.2024.105662},
  url = {https://www.sciencedirect.com/science/article/pii/S0098300424001456}
}

@inproceedings{Assis2024,
  author = {Italo Assis and Felipe Silva and Joao Fernandes and Idalmis Sardina and Tiago Barros and Samuel Xavier-de-Souza},
  title = {Automatic Workload Scheduling for Full Waveform Inversion in Shared-Memory Systems},
  booktitle = {Proc. Energy High Performance Computing Conference},
  organization = {Rice Ken Kennedy Institute},
  year = {2024},
  url = {https://www.energyhpc.rice.edu/_files/ugd/f0e64b_144054f921ba4faa9ca08fb789390f7b.pdf}
}

@article{10029876,
  author = {Nascimento, Diego V. Cirilo do and Georgiou, Kyriakos and Eder, Kerstin I.
and Xavier-de-Souza, Samuel},
  journal = {IEEE Embedded Systems Letters},
  title = {Evaluating the Effects of Reducing Voltage Margins for Energy-Efficient Operation of {MPSoCs}},
  url = {https://ieeexplore.ieee.org/document/10029876},
  year = {2024},
  volume = {16},
  number = {1},
  pages = {25--28},
  doi = {10.1109/LES.2023.3240625},
  issn = {1943-0671},
  month = mar
}

@article{FERNANDES2024101789,
  author = {Joao B. Fernandes and Felipe H. Santos-da-Silva and Tiago Barros and Italo A. S. Assis and Samuel Xavier-de-Souza},
  title = {{PATSMA}: Parameter Auto-tuning for Shared Memory Algorithms},
  journal = {SoftwareX},
  volume = {27},
  pages = {101789},
  year = {2024},
  issn = {2352-7110},
  doi = {10.1016/j.softx.2024.101789},
  url = {https://www.sciencedirect.com/science/article/pii/S2352711024001602}
}

% --- YEAR 2023 ---

@inproceedings{ENCOM2023-69,
  author = {Eduardo N. Velloso and L. F. Silveira},
  title = {Estimação de Canal {MU-MIMO} por Redes Recorrentes com Ajuste de Memória},
  booktitle = {Anais da XIII Conferência Nacional em Comunicações, Redes e Segurança da Informação},
  publisher = {ENCOM},
  year = {2023},
  pages = {69--70},
  url = {https://www.iecom.org.br/encom2023/autores.html#anais}
}

@inproceedings{ENCOM2023-61,
  author = {{Freitas Júnior}, Antônio A. and {Brito Júnior}, Agostinho de M. and L. F. Silveira},
  title = {Detecção de Ataques {DDoS} com Base em Métricas de Tráfego Usando {Viola-Jones}},
  booktitle = {Anais da XIII Conferência Nacional em Comunicações, Redes e Segurança da Informação},
  publisher = {ENCOM},
  year = {2023},
  pages = {61--62},
  url = {https://www.iecom.org.br/encom2023/autores.html#anais}
}

@inproceedings{CBIC2023-157,
  author = {A. A. {Freitas Junior} and F. S. {Lima Filho} and A. M. {Brito Junior} and L. F. Silveira},
  title = {Detecção de Ataques {DDoS} com Base em Métricas de Tráfego usando Redes Convolucionais},
  pages = {1--7},
  booktitle = {Anais do XVI Congresso Brasileiro de Inteligência Computacional ({CBIC}'2023)},
  editor = {E. Simas and D. D. Ferreira and L. R.
Oliveira},
  publisher = {SBIC},
  year = {2023},
  url = {https://sbic.org.br/eventos/cbic_2023/cbic2023-157/}
}

@article{Velloso_2023,
  author = {E. N. Velloso and F. Anthony and J.-D. do Nascimento and L. F. Q. Silveira and J. Hall and S. H. Saar},
  title = {Multicomponent Activity Cycles Using {Hilbert–Huang} Analysis},
  journal = {The Astrophysical Journal Letters},
  publisher = {The American Astronomical Society},
  volume = {945},
  number = {1},
  pages = {L12},
  year = {2023},
  doi = {10.3847/2041-8213/acb8b4},
  url = {https://dx.doi.org/10.3847/2041-8213/acb8b4}
}

% NOTE(review): the journal field of Costa2023 holds the publisher name (EAGE); confirm the actual venue title.
@article{Costa2023,
  author = {Da Costa, C. A. N. and Gebre, M. G. and Barros, T. and Lopez, J. L. and De Araújo, J. M. and De Souza, S. X.},
  title = {Improving repeatability of {4D} {OBN} data using interferometry by regularized multidimensional deconvolution},
  journal = {European Association of Geoscientists \& Engineers},
  year = {2023},
  pages = {1--5},
  issn = {2214-4609},
  doi = {10.3997/2214-4609.202310749},
  url = {https://www.earthdoc.org/content/papers/10.3997/2214-4609.202310749}
}

@article{Santos20235314,
  author = {Santos, Yuri P. and Silveira, Luiz F. Q.},
  title = {Adaptive Clustering of Users in Power Domain {NOMA}},
  journal = {Sensors},
  volume = {23},
  number = {11},
  article-number = {5314},
  year = {2023},
  issn = {1424-8220},
  url = {https://www.mdpi.com/1424-8220/23/11/5314}
}

@article{e25030503,
  author = {Avila, Anderson and Santos, Helida and Cruz, Anderson and Xavier-de-Souza, Samuel and Lucca, Giancarlo and Moura, Bruno and Yamin, Adenauer and Reiser, Renata},
  title = {{HybriD-GM}: A Framework for Quantum Computing Simulation Targeted to Hybrid Parallel Architectures},
  journal = {Entropy},
  volume = {25},
  number = {3},
  article-number = {503},
  year = {2023},
  url = {https://www.mdpi.com/1099-4300/25/3/503},
  issn = {1099-4300},
  doi = {10.3390/e25030503}
}

% --- YEAR 2022 ---

@inproceedings{Miller2022,
  doi = {10.1130/abs/2022am-382380},
  url = {https://doi.org/10.1130/abs/2022am-382380},
  year = {2022},
  publisher = {Geological Society of America},
  author = {Raoul Miller and Samuel Xavier-de-Souza and Manjula Ranagalage and H. K. S.
de Zoysa},
  title = {Moving Geoinformatics workloads into the cloud: real-world examples of enabling collaborative research},
  booktitle = {Geological Society of America Abstracts with Programs}
}

@inproceedings{Farias2022,
  author = {Farias, Johannes W. and Nascimento, Diego V. C. and Barros, Tiago and Xavier-de-Souza, Samuel},
  title = {Speculative guardband: exploiting critical-delay variations across cached instructions},
  booktitle = {2022 IFIP/IEEE 30th International Conference on Very Large Scale Integration (VLSI-SoC)},
  publisher = {IEEE},
  year = {2022},
  doi = {10.1109/VLSI-SoC54400.2022.9939597},
  url = {https://doi.org/10.1109/VLSI-SoC54400.2022.9939597}
}

% NOTE(review): the entry below had empty journal and type fields; they were dropped. Confirm the venue name and add it.
@article{eage:/content/papers/10.3997/2214-4609.2022.80004,
  author = {Santana, C. and Sardina, I. and Xavier-de-Souza, S.},
  title = {Fault Tolerance Library for geophysical numerical methods},
  year = {2022},
  volume = {2022},
  number = {1},
  pages = {1--5},
  doi = {10.3997/2214-4609.2022.80004},
  url = {https://www.earthdoc.org/content/papers/10.3997/2214-4609.2022.80004},
  publisher = {European Association of Geoscientists \& Engineers},
  issn = {2214-4609}
}

@inproceedings{sibgrapi_estendido,
  author = {Júlio Costa and Francinaldo Pereira and Davi Santos and Samuel Souza and Luiz Gonçalves},
  title = {Data Modelless Microservices to increase Multi-Tenancy in {BaaS} and {SaaS} Providers with Application to a {Covid-19} Data-Lake},
  booktitle = {Anais Estendidos da XXXV Conference on Graphics, Patterns and Images},
  location = {Natal/RN},
  year = {2022},
  pages = {177--182},
  publisher = {SBC},
  address = {Porto Alegre, RS, Brasil},
  doi = {10.5753/sibgrapi.est.2022.23284},
  url = {https://sol.sbc.org.br/index.php/sibgrapi_estendido/article/view/23284}
}

@article{ALVES2022108043,
  title = {Real-time wavelet-based adaptive algorithm for low inertia {AC} microgrids power measurements},
  journal = {International Journal of Electrical Power \& Energy Systems},
  volume =
{140},
  pages = {108043},
  year = {2022},
  issn = {0142-0615},
  doi = {10.1016/j.ijepes.2022.108043},
  url = {https://www.sciencedirect.com/science/article/pii/S0142061522000862},
  author = {Denis Keuton Alves and Ricardo Lúcio Araújo Ribeiro and Luiz Felipe de Queiroz Silveira and Thiago de Oliveira Alves Rocha},
  keywords = {Frequency estimation, Power components, Reactive power, Real-time estimation, Wavelet transform},
  abstract = {This paper proposes a real-time wavelet-based power estimator using a real-time modified stationary discrete wavelet packet transform (RT-MSDWPT). The proposed method overcomes the conventional SDWPT main constraints of power estimations related to the lack of reactive power flow direction and susceptibility to off-nominal frequency operation. The introduction of a digital sampling-shifting of a quarter of the fundamental, applied to the filtered voltages, assures the reactive power flow direction. Additionally, the insertion of an adaptive sampling time procedure based on the power grid frequency estimation mitigates the errors introduced by the network frequency deviations. These modifications make the RT-MSDWPT suitable for being embedded into the standard hierarchical power flow control strategies of ac microgrids. Experimental results assessed using an ac microgrid laboratory setup, operating under different operational scenarios, demonstrate the feasibility of the proposed solution.}
}

@article{electronics11050689,
  author = {da Silva, Vitor Ramos Gomes and da Silva, Anderson Bráulio Nóbrega and Valderrama, Carlos and Manneback, Pierre and Xavier-de-Souza, Samuel},
  title = {A Minimally Intrusive Approach for Automatic Assessment of Parallel Performance Scalability of Shared-Memory {HPC} Applications},
  journal = {Electronics},
  volume = {11},
  year = {2022},
  number = {5},
  article-number = {689},
  url = {https://www.mdpi.com/2079-9292/11/5/689},
  issn = {2079-9292},
  abstract = {High-performance computing systems have become increasingly dynamic, complex, and unpredictable. To help build software that uses full-system capabilities, performance measurement and analysis tools exploit extensive execution analysis focusing on single-run results. Despite being effective in identifying performance hotspots and bottlenecks, these tools are not sufficiently suitable to evaluate the overall scalability trends of parallel applications. Either they lack the support for combining data from multiple runs or collect excessive data, causing unnecessary overhead. In this work, we present a tool for automatically measuring and comparing several executions of a parallel application according to various scenarios characterized by the input arrangements, the number of threads, number of cores, and frequencies. Unlike other existing performance analysis tools, the proposed work covers some gaps in specialized features necessary to better understand computational resources scalability trends across configurations. In order to improve scalability analysis and productivity over the vast spectrum of possible configurations, the proposed tool features automatic instrumentation, direct mapping of parallel regions, accuracy-preserving data reductions, and ease of use.
As it aims at accurately understanding scalability trends of parallel applications, detailed single-run performance analyses show minimal intrusion (less than 1\% overhead).},
  doi = {10.3390/electronics11050689}
}

@article{en15031213,
  author = {Ramos Gomes da Silva, Vitor and Valderrama, Carlos and Manneback, Pierre and Xavier-de-Souza, Samuel},
  title = {Analytical Energy Model Parametrized by Workload, Clock Frequency and Number of Active Cores for Share-Memory High-Performance Computing Applications},
  journal = {Energies},
  volume = {15},
  year = {2022},
  number = {3},
  article-number = {1213},
  url = {https://www.mdpi.com/1996-1073/15/3/1213},
  issn = {1996-1073},
  abstract = {Energy consumption is crucial in high-performance computing (HPC), especially to enable the next exascale generation. Hence, modern systems implement various hardware and software features for power management. Nonetheless, due to numerous different implementations, we can always push the limits of software to achieve the most efficient use of our hardware. To be energy efficient, the software relies on dynamic voltage and frequency scaling (DVFS), as well as dynamic power management (DPM). Yet, none have privileged information on the hardware architecture and application behavior, which may lead to energy-inefficient software operation. This study proposes analytical modeling for architecture and application behavior that can be used to estimate energy-optimal software configurations and provide knowledgeable hints to improve DVFS and DPM techniques for single-node HPC applications. Additionally, model parameters, such as the level of parallelism and dynamic power, provide insights into how the modeled application consumes energy, which can be helpful for energy-efficient software development and operation. This novel analytical model takes the number of active cores, the operating frequencies, and the input size as inputs to provide energy consumption estimation. We present the modeling of 13 parallel applications employed to determine energy-optimal configurations for several different input sizes. The results show that up to 70\% of energy could be saved in the best scenario compared to the default Linux choice and 14\% on average. We also compare the proposed model with standard machine-learning modeling concerning training overhead and accuracy. The results show that our approach generates about 10 times less energy overhead for the same level of accuracy.},
  doi = {10.3390/en15031213}
}

% --- YEAR 2021 ---

@inproceedings{sadite2021parallel,
  author = {de Lima, Raffael S. C. G. and Duarte, Jose Marcelo L. and Nascimento, Diego V. Cirilo do and de Souza Filho, Reinaldo A. and Xavier-de-Souza, Samuel},
  title = {A parallel software-defined ultra-low-power receiver for a satellite message forwarding system},
  booktitle = {2021 XI Brazilian Symposium on Computing Systems Engineering (SBESC)},
  pages = {1--8},
  publisher = {IEEE},
  year = {2021},
  doi = {10.1109/SBESC53686.2021.9628300},
  url = {http://doi.org/10.1109/SBESC53686.2021.9628300}
}

@article{ARAUJO2021boosting,
  title = {Boosting memory access locality of the {Spectral Element Method} with {Hilbert} space-filling curves},
  journal = {Computers \& Geosciences},
  pages = {104938},
  year = {2021},
  issn = {0098-3004},
  doi = {10.1016/j.cageo.2021.104938},
  url = {https://www.sciencedirect.com/science/article/pii/S0098300421002260},
  author = {Roger R. F. Araújo and Lutz Gross and Samuel Xavier-de-Souza},
  keywords = {Hilbert space-filling curves, Spectral Element Method, Unstructured meshes, Acoustic waves, Wave propagation, Parallel processing},
  abstract = {We propose an algorithm based on Hilbert space-filling curves to reorder mesh elements in memory for use with the Spectral Element Method, aiming to attain fewer cache misses, better locality of data reference and faster execution.
We present a technique to numerically simulate acoustic wave propagation in 2D domains using the Spectral Element Method, and discuss computational performance aspects of this procedure. We reorder mesh-related data via Hilbert curves to achieve sizable reductions in execution time under several mesh configurations in shared-memory systems. Our experiments show that the Hilbert curve approach works well with meshes of several granularities and also with small and large variations in element sizes, achieving reductions between 9\% and 25\% in execution time when compared with three other ordering schemes.}
}

@inproceedings{Santana2021,
  author = {Santana, C. and Assis, {\'{I}}. and Barros, T. and Sardina, I. and Xavier-de-Souza, S.},
  title = {Fault Tolerance Applied to {3D} Full Waveform Inversion},
  booktitle = {Digital Subsurface Conference in Latin America},
  publisher = {European Association of Geoscientists \& Engineers},
  volume = {2021},
  number = {1},
  pages = {1--5},
  month = may,
  year = {2021},
  issn = {2214-4609},
  doi = {10.3997/2214-4609.202181013},
  url = {https://www.earthdoc.org/content/papers/10.3997/2214-4609.202181013}
}

@article{en14113161,
  author = {Oliveira, Tadeu F. and Xavier-de-Souza, Samuel and Silveira, Luiz F.},
  title = {Improving Energy Efficiency on {SDN} Control-Plane Using Multi-Core Controllers},
  journal = {Energies},
  volume = {14},
  year = {2021},
  number = {11},
  article-number = {3161},
  url = {https://www.mdpi.com/1996-1073/14/11/3161},
  issn = {1996-1073},
  abstract = {Software-defined networks have become more common in data centers. The programmability of these networks is a great feature that allows innovation to be deployed fast, following the increasing number of new applications. This growth comes with a cost of more processing power and energy consumption. Many researchers have tackled this issue using existing routing techniques to dynamically adjust the network forwarding plane to save energy. On the control-plane, researchers have found algorithms for positioning the controller in a way to reduce the number of used links, thus reducing energy. These strategies reduce energy consumption at the expense of processing power of the controllers. This paper proposes a novel approach to energy efficiency focused on the network’s control-plane, which is complementary to the many already existing data-plane solutions. It takes advantage of the parallel processing capabilities of modern off-the-shelf multicore processors to split the many tasks of the controller among the cores. By dividing the tasks among homogeneous cores, one can lower the frequency of operations, lowering the overall energy consumption while keeping the same quality of service level. We show that a multicore controller can use an off-the-shelf multicore processor to save energy while keeping the level of service. We performed experiments based on standard network measures, namely latency and throughput, and standard energy efficiency metrics for data centers such as the Communication Network Energy Efficiency (CNEE) metric. Higher energy efficiency is achieved by a parallel implementation of the controller and lowering each core’s frequency of operation. In our experiments, we achieved a drop of 28\% on processor energy use for a constant throughput scenario when comparing with the single-core approach.},
  doi = {10.3390/en14113161}
}

@article{Araujo2021,
  abstract = {Sucker-rod pumping wells can be either vertical or directional. Over time, research efforts on the functioning of vertical wells led to a well-established set of mathematical models and practical tools. When it comes to directional wells, however, no general agreement has been reached, and the topic remains in active discussion. This paper revisits, extends, implements and optimizes an overlooked model, initially devised in 1995, whose computational complexity resulted in long processing times that stymied its adoption.
This model fully utilizes the 3D trajectory of the rod string, allowing for the use of two viscous friction models and proposing its own formulation for downhole boundary conditions. The resulting model can be used to efficiently simulate the dynamic behavior of directional sucker-rod pumping wells taking into account the fluid flow inside the rod-tubing annulus. We present and analyze a serial and a parallel software implementation of this CPU-intensive model based on an explicit finite-difference method. We also describe our contributions to the accuracy and performance of the original model and software implementation. A rough approximation shows that the proposed serial version is about 200 times faster than the legacy original code, if we were to run the latter in a modern processor. On top of that our parallel implementation achieved a $6.5\times$ speedup over the serial version in a shared-memory system, making it a suitable tool for well design and optimization. The research contributes to the discussions on mathematical modeling of directional sucker-rod pumping wells, and illustrates how performance-focused techniques can enable the effective use of computationally demanding models to facilitate further refinements and applications.},
  author = {Araújo, Roger R. F. and Xavier-de-Souza, Samuel},
  doi = {10.1007/s13202-021-01161-x},
  issn = {2190-0566},
  journal = {Journal of Petroleum Exploration and Production},
  keywords = {Energy Systems,Geology,Industrial Chemistry/Chemical Engineering,Industrial and Production Engineering,Monitoring/Environmental Analysis,Offshore Engineering},
  month = may,
  pages = {1--25},
  publisher = {Springer},
  title = {A simulation model for dynamic behavior of directional sucker-rod pumping wells: implementation, analysis, and optimization},
  url = {https://link.springer.com/article/10.1007/s13202-021-01161-x},
  year = {2021}
}

@article{BERNED2021101959,
  title = {Low learning-cost offline strategies for {EDP} optimization of parallel applications},
  journal = {Journal of Systems Architecture},
  volume = {114},
  pages = {101959},
  year = {2021},
  issn = {1383-7621},
  doi = {10.1016/j.sysarc.2020.101959},
  url = {https://www.sciencedirect.com/science/article/pii/S1383762120302101},
  author = {Gustavo Paim Berned and Fábio D. Rossi and Marcelo C. Luizelli and Samuel Xavier {de Souza} and Antonio Carlos S. Beck and Arthur F. Lorenzon},
  keywords = {Parallel Computing, Runtime optimization systems, Thread-level parallelism exploitation, Energy-delay product},
  abstract = {Many parallel applications do not scale with the number of threads. Several online and offline strategies have been proposed in order to optimize this number. While the former strategy can capture some behaviors that can only be known at runtime, the latter do not impose any execution overhead and can use more complex and efficient algorithms. However, the learning algorithm in these offline strategies may take several hours, precluding their use or a smooth portability across different systems.
In this scenario, we propose a methodology to decrease the learning time of offline strategies by inferring the execution behavior of parallel applications using smaller input sets than the ones used by the target applications. It implements two search strategies: SEA, where all parallel regions of an application run with the same number of threads; and SPRA, which seeks to find an ideal number of threads for each parallel region of a given application. With an extensive set of experiments, we show that SEA and SPRA strategies converge to results close to an offline approach applied over the regular input, but being 88\% and 87\% faster, on average, respectively. We also show that SPRA is better than SEA for unbalanced applications.}
}

@article{SOUZA2021107150,
  author = {F. P. Souza and L. F. Q. Silveira and F. B. Costa and M. M. Leal},
  title = {High-Impedance Fault Identification Using Cyclostationary Characteristic Analysis},
  journal = {Electric Power Systems Research},
  volume = {195},
  pages = {107150},
  year = {2021},
  issn = {0378-7796},
  doi = {10.1016/j.epsr.2021.107150},
  url = {https://www.sciencedirect.com/science/article/pii/S0378779621001310},
  keywords = {High impedance fault, cyclostationary analysis, alpha profile, distribution systems},
  abstract = {Conventional overcurrent-based protection systems are generally not sensitive to high impedance faults (HIFs) since they have a low overcurrent amplitude. This type of fault causes damages to dealers and can provoke the deaths of people and animals. Therefore, different methods for identifying HIFs in electric power distribution systems have been proposed. However, besides the low fault overcurrent level be still a problem, the noise interference on signals is also a difficulty for non-conventional methods. Therefore, this work proposes a reliable method based on statistical characteristics for identifying HIFs regardless of the noise interference and the overcurrent level. Specifically, the method uses cyclostationary characteristic analysis to extract cyclic autocorrelation information from the signals of interest by calculating the cyclic spectral density function. From this information, HIFs can be properly identified among other power system disturbances. The performance of the method was assessed with actual HIF data and with realistic HIF simulations, presenting promising results.}
}

@article{Fontes2021,
  author = {Fontes, Aluisio I. R. and Linhares, Leandro L. S. and Guimar{\~a}es, Jo{\~a}o P. F. and Silveira, Luiz F. Q. and Martins, Allan M.},
  title = {An adaptive kernel width convex combination method for maximum correntropy criterion},
  journal = {Journal of the Brazilian Computer Society},
  year = {2021},
  month = mar,
  day = {23},
  volume = {27},
  number = {1},
  pages = {7},
  abstract = {Recently, the maximum correntropy criterion (MCC) has been successfully applied in numerous applications regarding nonGaussian data processing. MCC employs a free parameter called kernel width, which affects the convergence rate, robustness, and steady-state performance of the adaptive filtering. However, determining the optimal value for such parameter is not always a trivial task. Within this context, this paper proposes a novel method called adaptive convex combination maximum correntropy criterion (ACCMCC), which combines an adaptive kernel algorithm with convex combination techniques. ACCMCC takes advantage from a convex combination of two adaptive MCC-based filters, whose kernel widths are adjusted iteratively as a function of the minimum error value obtained in a predefined estimation window.
Results obtained in impulsive noise environment have shown that the proposed approach achieves equivalent convergence rates but with increased accuracy and robustness when compared with other similar algorithms reported in literature.},
  issn = {1678-4804},
  doi = {10.1186/s13173-021-00111-z},
  url = {https://doi.org/10.1186/s13173-021-00111-z}
}

% --- YEAR 2020 ---

@inproceedings{ENCOM2020-49,
  author = {Frederico Augusto Fernandes Silveira and Francisco S. Lima Filho and Felipe Sampaio Dantas Silva and Agostinho de Medeiros Brito Junior and Luiz Felipe Silveira},
  title = {Mitigação de {DDoS} Usando {SDN}},
  booktitle = {Anais da X Conferência Nacional em Comunicações, Redes e Segurança da Informação},
  publisher = {ENCOM},
  year = {2020},
  pages = {49--50},
  url = {https://iecom.org.br/encom2020/autores.html#anais_sec}
}

@inproceedings{ENCOM2020-151,
  author = {Tadeu Ferreira Oliveira and Luiz Felipe Silveira},
  title = {Impacto Energético do Processamento no Consumo de Controladores de Redes Definidas por Software},
  booktitle = {Anais da X Conferência Nacional em Comunicações, Redes e Segurança da Informação},
  publisher = {ENCOM},
  year = {2020},
  pages = {151--152},
  url = {https://iecom.org.br/encom2020/autores.html#anais_sec}
}

@inproceedings{ENCOM2020-103,
  author = {Jose Lenival Gomes de França and Luiz Felipe de Queiroz Silveira},
  title = {Hopping {DFT} Subamostrada},
  booktitle = {Anais da X Conferência Nacional em Comunicações, Redes e Segurança da Informação},
  publisher = {ENCOM},
  year = {2020},
  pages = {103--104},
  url = {https://iecom.org.br/encom2020/autores.html#anais_sec}
}

@inproceedings{ENCOM2020-163,
  author = {Aluisio I. R. Fontes and Joao P. F. Guimarães and Pedro T. V. de Souza and Tales V. R. de O. Câmara and Allan de M. Martins and Luiz F. de Q.
Silveira},
  year = {2020},
  pages = {163--164},
  title = {Extração de características Cicloestacionarias por Correntropia Cíclica em Canais com Desvanecimento},
  url = {https://iecom.org.br/encom2020/autores.html#anais_sec},
  booktitle = {Anais da X Conferência Nacional em Comunicações, Redes e Segurança da Informação},
  publisher = {ENCOM}
}

@inproceedings{ENCOM2020-145,
  author = {Felipe O. S. Gama and Luiz F. Q. Silveira and Andres O. Salazar},
  title = {Desempenho da Codificação Wavelet M-ária Sob Condições de Erros de Estimação do Canal},
  booktitle = {Anais da X Conferência Nacional em Comunicações, Redes e Segurança da Informação},
  publisher = {ENCOM},
  year = {2020},
  pages = {145--146},
  url = {https://iecom.org.br/encom2020/autores.html#anais_sec}
}

@inproceedings{ENCOM2020-159,
  author = {Pedro T. V. de Souza and Aluisio I. F. Rego and Vinicius S. V. de Souza and Luiz F. Silveira},
  title = {Classificação de Modulação utilizando Cicloestacionariedades e Árvores de Decisão},
  booktitle = {Anais da X Conferência Nacional em Comunicações, Redes e Segurança da Informação},
  publisher = {ENCOM},
  year = {2020},
  pages = {159--160},
  url = {https://iecom.org.br/encom2020/autores.html#anais_sec}
}

@inproceedings{ENCOM2020-95,
  author = {Yuri P. Santos and Andressa Stefany Oliveira and Luiz Affonso Guedes and Luiz F. Q. Silveira},
  title = {Classificação Automática de Modulações: Uma Abordagem Evolutiva},
  booktitle = {Anais da X Conferência Nacional em Comunicações, Redes e Segurança da Informação},
  publisher = {ENCOM},
  year = {2020},
  pages = {95--96},
  url = {https://iecom.org.br/encom2020/autores.html#anais_sec}
}

@inproceedings{ENCOM2020-139,
  author = {Cassiano P. Carvalho and Nathalee C. A. Lima and Pedro T. V. Souza and Luiz F. Silveira and Luiz M. G.
Gonçalves},
  year = {2020},
  pages = {139--140},
  title = {Classificação Automática de Modulações em Canal com {Doppler} Utilizando Redes Neurais e Perfil Alfa Reduzido},
  url = {https://iecom.org.br/encom2020/autores.html#anais_sec},
  booktitle = {Anais da X Conferência Nacional em Comunicações, Redes e Segurança da Informação},
  publisher = {ENCOM}
}

@article{melo2020parallel,
  author = {Savio R. M. Melo and Herlan A. P. da Silva and Samuel Xavier de Souza and Luiz F. de Q. Silveira and Aluisio I. R. Fontes},
  title = {Parallel Performance Analysis of Cyclic Correntropy for Energy-Efficient Wireless Communications},
  journal = {IEEE Latin America Transactions},
  year = {2020},
  pages = {2089--2095},
  issn = {1548-0992},
  url = {https://latamt.ieeer9.org/index.php/transactions/article/view/4450}
}

@inproceedings{FernandesSilveira2020,
  author = {F. A. {Fernandes Silveira} and F. {Lima-Filho} and F. S. {Dantas Silva} and A. {de Medeiros Brito Junior} and L. F. {Silveira}},
  title = {{Smart Detection-IoT}: A {DDoS} Sensor System for {Internet of Things}},
  booktitle = {2020 International Conference on Systems, Signals and Image Processing (IWSSIP)},
  year = {2020},
  pages = {343--348},
  doi = {10.1109/IWSSIP48289.2020.9145265},
  url = {http://doi.org/10.1109/IWSSIP48289.2020.9145265}
}

@inproceedings{sbesc_estendido,
  author = {Igor Silva and Otávio do Espírito Santo and Diego do Nascimento and Samuel Xavier-de-Souza},
  title = {{CEVERO}: A soft-error hardened {SoC} for aerospace applications},
  booktitle = {Anais Estendidos do X Simpósio Brasileiro de Engenharia de Sistemas Computacionais},
  location = {Evento Online},
  year = {2020},
  pages = {121--126},
  publisher = {SBC},
  address = {Porto Alegre, RS, Brasil},
  url = {https://sol.sbc.org.br/index.php/sbesc_estendido/article/view/13100}
}

@inproceedings{costa2020desenvolvimento,
  author = {S-F-da-Costa, Júlio Gustavo and Xavier-de-Souza, Samuel and Petta, Reinaldo Antônio},
  title = {Desenvolvimento Guiado por
Interpretação de Metadados}, booktitle = {ISLA 2020 Proceedings}, year = {2020}, number = {4}, url = {\url{https://aisel.aisnet.org/isla2020/4}}, } @article{Assis2020, author = {Assis, Italo A. S. and Fernandes, Joao B. and Barros, Tiago and Xavier-De-Souza, Samuel}, doi = {10.1109/ACCESS.2020.3015045}, issn = {2169-3536}, journal = {IEEE Access}, pages = {145115--145127}, title = {{Auto-Tuning of Dynamic Scheduling Applied to 3D Reverse Time Migration on Multicore Systems}}, url = {https://ieeexplore.ieee.org/document/9162016/}, volume = {8}, year = {2020} } @article{CoutinhoDemetrios2020, abstract = {This work proposes a methodology to find performance and energy trade-offs for parallel applications running on Heterogeneous Multi-Processing systems with a single instruction-set architecture. These offer flexibility in the form of different core types and voltage and frequency pairings, defining a vast design space to explore. Therefore, for a given application, choosing a configuration that optimizes the performance and energy consumption is not straightforward. Our method proposes novel analytical models for performance and power consumption whose parameters can be fitted using only a few strategically sampled offline measurements. These models are then used to estimate an application's performance and energy consumption for the whole configuration space. In turn, these offline predictions define the choice of estimated Pareto-optimal configurations of the model, which are used to inform the selection of the configuration that the application should be executed on. The methodology was validated on an ODROID-XU3 board for eight programs from the PARSEC Benchmark, Phoronix Test Suite and Rodinia applications. The generated Pareto-optimal configuration space represented a 99% reduction of the universe of all available configurations. 
Energy savings of up to 59.77\%, 61.38\% and 17.7\% were observed when compared to the performance, ondemand and powersave Linux governors, respectively, with higher or similar performance.},
  author    = {Coutinho, Demetrios A. M. and {De Sensi}, Daniele and Lorenzon, Arthur Francisco and Georgiou, Kyriakos and Nunez-Yanez, Jose and Eder, Kerstin and Xavier-de-Souza, Samuel},
  doi       = {10.3390/en13092409},
  issn      = {1996-1073},
  journal   = {Energies},
  keywords  = {Energy efficiency,Heterogeneous multi-processing,Pareto frontier,Power model},
  month     = may,
  number    = {9},
  pages     = {2409},
  publisher = {MDPI AG},
  title     = {Performance and Energy Trade-Offs for Parallel Applications on Heterogeneous Multi-Processing Systems},
  url       = {https://www.mdpi.com/1996-1073/13/9/2409},
  volume    = {13},
  year      = {2020},
}

@article{Furtunato2020,
  abstract  = {After Amdahl's trailblazing work, many other authors proposed analytical speedup models but none have considered the limiting effect of the memory wall. These models exploited aspects such as problem-size variation, memory size, communication overhead, and synchronization overhead, but data-access delays are assumed to be constant. Nevertheless, such delays can vary, for example, according to the number of cores used and the ratio between processor and memory frequencies. Given the large number of possible configurations of operating frequency and number of cores that current architectures can offer, suitable speedup models to describe such variations among these configurations are quite desirable for off-line or on-line scheduling decisions. This work proposes a new parallel speedup model that accounts for the variations on the average data-access delay to describe the limiting effect of the memory wall on parallel speedups in homogeneous shared-memory architectures. Analytical results indicate that the proposed modeling can capture the desired behavior while experimental hardware results validate the former. Additionally, we show that when accounting for parameters that reflect the intrinsic characteristics of the applications, such as the degree of parallelism and susceptibility to the memory wall, our proposal has significant advantages over machine-learning-based modeling. Moreover, our experiments show that conventional machine-learning modeling, besides being black-boxed, needs about one order of magnitude more measurements to reach the same level of accuracy achieved by the proposed model.},
  author    = {Furtunato, Alex F. A. and Georgiou, Kyriakos and Eder, Kerstin and Xavier-de-Souza, Samuel},
  doi       = {10.1109/ACCESS.2020.2990418},
  issn      = {2169-3536},
  journal   = {IEEE Access},
  keywords  = {Parallel systems,data access delay,memory wall,performance modeling,speedup},
  pages     = {79225--79238},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  title     = {When parallel speedups hit the memory wall},
  volume    = {8},
  year      = {2020},
  url       = {https://ieeexplore.ieee.org/document/9078685},
}

@article{Pena2020,
  abstract  = {The aim of this letter is to propose a new robust method for time delay estimation over impulsive noise and investigate its practical implications. The method uses a non-linear data transformation associated with the generalized cross-correlation technique. Hence, simulations and experiments show better performance than traditional methods without increasing the computational cost.
Our practical experiments indicate the possibility of obtaining a correlated impulsive noise, in which the proposed method is still presenting accurate estimations.},
  author    = {Pena, Danilo and Lima, Arthur and de Sousa, Jr, Vicente and Silveira, Luiz and Martins, Allan},
  doi       = {10.14209/jcis.2020.9},
  issn      = {1980-6604},
  journal   = {Journal of Communication and Information Systems},
  keywords  = {direction-of-arrival estimation,acoustic noise,acoustic signal processing},
  month     = apr,
  number    = {1},
  pages     = {86--89},
  publisher = {Sociedade Brasileira de Telecomunicações},
  title     = {Robust time delay estimation based on {non-Gaussian} impulsive acoustic channel},
  url       = {https://jcis.sbrt.org.br/jcis/article/view/687},
  volume    = {35},
  year      = {2020},
}

@article{Pereira2020,
  abstract  = {We propose an approach for the computation of time offsets between audio sequences that contain musical sounds from different instruments produced in a distributed way and have, as the main characteristic, the existence of a set of weak features that are not useful as alignment points in their current form. Therefore, it is necessary to apply transformations in order to find a set of distinctive features to compute the offset values in a suitable way. The main issue that occurs with such a system is its nonlinearity that does not allow the delay to be predicted by using a linear function. To solve this problem, we propose to use a set of Long Short-Term Memory (LSTM) layers to create a neural network model capable of learning such features transformations in a supervised approach using a gradient descent optimizer. We demonstrate the use of a recurrence matrix to extract timing information from a set of transformed features given by the neural network output. With this approach, we could classify up to 60\% of a specific combination from the MedleyDB dataset and reduce the search space to five possibilities with an accuracy up to 90\% while keeping the precision of 10 ms. This performance is equal to or better than state-of-the-art methods.},
  author    = {Pereira, Igor and Distante, Cosimo and Silveira, Luiz F. and Gonçalves, Luiz},
  doi       = {10.17743/jaes.2019.0057},
  issn      = {1549-4950},
  journal   = {AES: Journal of the Audio Engineering Society},
  month     = mar,
  number    = {3},
  pages     = {157--167},
  publisher = {Audio Engineering Society},
  title     = {Using neural networks to compute time offsets from musical instruments},
  volume    = {68},
  year      = {2020},
  url       = {https://www.aes.org/e-lib/browse.cfm?elib=20726},
}

@inproceedings{Pinheiro2020,
  abstract  = {Lightweight coresets are compact representations of data sets such that clustering methods present competitive results in relation to the complete data set. They are constructed by sampling important points from the complete set. We propose a fast method to approximate the sampling of lightweight coresets from very large data sets which are distributed among multiple machines. We show that the proposed method is much faster and scalable, reaching results 48 times faster than the original lightweight coresets, while holding similar properties.},
  author    = {Pinheiro, Daniel N and Xavier-de-Souza, Samuel and Aloise, Daniel},
  booktitle = {2020 {IEEE} International Parallel and Distributed Processing Symposium Workshops ({IPDPSW})},
  doi       = {10.1109/IPDPSW50202.2020.00078},
  isbn      = {978-1-7281-7445-7},
  keywords  = {Big Data,distributed data,high-performance computing,k-means clustering,lightweight coresets},
  month     = may,
  pages     = {426--429},
  publisher = {IEEE},
  title     = {Scaling Optimizations for Large-Scale Distributed Data with Lightweight Coresets},
  url       = {https://ieeexplore.ieee.org/document/9150463/},
  year      = {2020},
}

@article{Pinheiro2020a,
  abstract  = {K-medoids clustering is among the most popular methods for cluster analysis despite its use requiring several assumptions about the nature of the latent clusters.
In this paper, we introduce the Convex Fuzzy k-Medoids (CFKM) model, which not only relaxes the assumption that objects must be assigned entirely to one and only one medoid, but also that medoids must be assigned entirely to one and only one cluster. The resulting model is convex, thus its resolution is completely robust to initialization. To illustrate the usefulness of the CFKM model, we compare it with two fuzzy k-medoids clustering models: the Fuzzy k-Medoids (FKM) and the Fuzzy Clustering with Multi-Medoids (FMMdd), both solved approximately by heuristics because of their hard computational complexity. Our experiments with both synthetic and real-world data as well as a user survey reveal that the model is not only more robust to the choice hyperparameters of the fuzzy clustering task, but also that it can uniquely discover important aspects of data inherently fuzzy in nature.},
  author    = {Pinheiro, Daniel N. and Aloise, Daniel and Blanchard, Simon J.},
  doi       = {10.1016/j.fss.2020.01.001},
  issn      = {0165-0114},
  journal   = {Fuzzy Sets and Systems},
  keywords  = {Categorization,Fuzzy clustering,Unsupervised learning},
  month     = jun,
  pages     = {66--92},
  publisher = {Elsevier B.V.},
  title     = {Convex fuzzy k-medoids clustering},
  volume    = {389},
  year      = {2020},
  url       = {https://www.doi.org/10.1016/j.fss.2020.01.001},
}

@article{Ramos2020,
  abstract  = {This paper presents a fully automatic method for the separation of diffuse and specular reflection components from a single image. Overall, the mechanisms in which the available methods operate on are computationally costly and do not translate well to modern hardware-implemented image processing pipelines, such as the ones present in consumer electronics. Consequently, the objective of this article is to introduce a simple yet effective method for specular highlight removal. It is based on the dichromatic reflection model and operates through histogram matching in the YCbCr color space. The proposed method performs in real-time. It only uses global image statistics and point-wise intensity transformations. Experimental evaluation shows that the proposed approach has competitive results in comparison to state-of-the-art methods. Limitations of the proposed approach are seldom and are common to most methods available. The proposed method, however, achieves better quality results with much less computational cost, thus enabling feasibility in systems with limited processing power.},
  author    = {Ramos, Vítor S. and Silveira, Luiz Gonzaga De Q. and Silveira, Luiz Felipe De Q.},
  doi       = {10.1109/ACCESS.2019.2963037},
  issn      = {2169-3536},
  journal   = {IEEE Access},
  keywords  = {Blind source separation,feature extraction,image color analysis,image enhancement,image processing,image texture analysis},
  pages     = {3240--3254},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  title     = {Single Image Highlight Removal for Real-Time Image Processing Pipelines},
  volume    = {8},
  year      = {2020},
  url       = {https://www.doi.org/10.1109/ACCESS.2019.2963037},
}

@inproceedings{Rodrigues2020,
  abstract  = {The growth of data to be processed in the Oil \& Gas industry matches the requirements imposed by evolving algorithms based on stencil computations, such as Full Waveform Inversion and Reverse Time Migration. Graphical processing units (GPUs) are an attractive architectural target for stencil computations because of its high degree of data parallelism. However, the rapid architectural and technological progression makes it difficult for even the most proficient programmers to remain up-to-date with the technological advances at a micro-architectural level. In this work, we present an extension for an open source compiler designed to produce highly optimized finite difference kernels for use in inversion methods named Devito{\textcopyright}. We embed it with the Oxford Parallel Domain Specific Language (OP-DSL) in order to enable automatic code generation for GPU architectures from a high-level representation.
We aim to enable users coding in a symbolic representation level to effortlessly get their implementations leveraged by the processing capacities of GPU architectures. The implemented backend is evaluated on a NVIDIA{\textregistered} GTX Titan Z, and on a NVIDIA{\textregistered} Tesla V100 in terms of operational intensity through the roof-line model for varying space-order discretization levels of 3D acoustic isotropic wave propagation stencil kernels with and without symbolic optimizations. It achieves approximately 63\% of V100's peak performance and 24\% of Titan Z's peak performance for stencil kernels over grids with $256^3$ points. Our study reveals that improving memory usage should be the most efficient strategy for leveraging the performance of the implemented solution on the evaluated architectures.},
  archivePrefix = {arXiv},
  arxivId       = {1912.00695},
  author        = {Rodrigues, Vitor Hugo Mickus and Cavalcante, Lucas and Pereira, Maelso Bruno and Luporini, Fabio and Reguly, István and Gorman, Gerard and Xavier-de-Souza, Samuel},
  booktitle     = {Communications in Computer and Information Science},
  doi           = {10.1007/978-3-030-41005-6_16},
  eprint        = {1912.00695},
  isbn          = {9783030410049},
  issn          = {1865-0937},
  keywords      = {Devito,Domain Specific Languages,Finite-differences,GPU,OPS,Parallel architectures,Stencil kernels},
  month         = sep,
  pages         = {230--244},
  publisher     = {Springer},
  title         = {{GPU} Support for Automatic Generation of Finite-Differences Stencil Kernels},
  url           = {https://link.springer.com/chapter/10.1007/978-3-030-41005-6_16},
  volume        = {1087},
  year          = {2020},
}
% NOTE(review): in Rodrigues2020 the booktitle field holds the series name;
% confirm the actual proceedings title and move the series name to "series".

@article{Silva-de-Souza2020,
  abstract  = {Run-time profiling of software applications is key to energy efficiency. Even the most optimized hardware combined to an optimally designed software may become inefficient if operated poorly. Moreover, the diversification of modern computing platforms and broadening of their run-time configuration space make the task of optimally operating software ever more complex. With the growing financial and environmental impact of data center operation and cloud-based applications, optimal software operation becomes increasingly more relevant to existing and next-generation workloads. In order to guide software operation towards energy savings, energy and performance data must be gathered to provide a meaningful assessment of the application behavior under different system configurations, which is not appropriately addressed in existing tools. In this work we present Containergy, a new performance evaluation and profiling tool that uses software containers to perform application run-time assessment, providing energy and performance profiling data with negligible overhead (below 2\%). It is focused on energy efficiency for next generation workloads. Practical experiments with emerging workloads, such as video transcoding and machine-learning image classification, are presented. The profiling results are analyzed in terms of performance and energy savings under a Quality-of-Service (QoS) perspective. For video transcoding, we verified that wrong choices in the configuration space can lead to an increase above 300\% in energy consumption for the same task and operational levels. Considering the image classification case study, the results show that the choice of the machine-learning algorithm and model affect significantly the energy efficiency. Profiling datasets of AlexNet and SqueezeNet, which present similar accuracy, indicate that the latter represents 55.8\% in energy saving compared to the former.},
  author    = {Silva-de-Souza, Wellington and Iranfar, Arman and Bráulio, Anderson and Zapater, Marina and Xavier-de-Souza, Samuel and Olcoz, Katzalin and Atienza, David},
  doi       = {10.3390/en13092162},
  issn      = {1996-1073},
  journal   = {Energies},
  keywords  = {DVFS,Energy profiling,Performance counters,Performance profiling,Software containers},
  month     = may,
  number    = {9},
  pages     = {2162},
  publisher = {MDPI AG},
  title     = {{Containergy}—A Container-Based Energy and Performance Profiling Tool for Next Generation Workloads},
  url       = {https://www.mdpi.com/1996-1073/13/9/2162},
  volume    = {13},
  year      = {2020},
}

@inproceedings{souzafilho2020,
  author        = {{Souza Filho}, R. A. and Nascimento, D. V. C. and Xavier-de-Souza, Samuel},
  booktitle     = {Proceedings of The Thirteenth International Workshop on Programmability and Architectures for Heterogeneous Multicores},
  title         = {An {OpenMP} translator for {GAP8} {MPSoC}},
  archivePrefix = {arXiv},
  eprint        = {2007.10219},
  url           = {https://arxiv.org/abs/2007.10219},
  year          = {2020},
}

@article{ValeriodeSouza2020,
  abstract  = {In mobile communication systems, the signals propagate through multipath over time-varying channels, which are subject to distortion caused by fading and Doppler shifts. In order to minimize such distortions, coding techniques and transmission diversity can be employed, e.g., wavelet coding. In this work, the wavelet coding is investigated in scenarios of cognitive radio systems with dynamic spectrum access. Cognitive radio systems with dynamic spectrum access should be able to sense unoccupied frequency bands for opportunistic transmissions, as well as detect the presence of primary users when they occupy their licensed spectrum. Therefore, an essential element for the accurate operation of cognitive radio systems encoded by wavelet coding is the ability to sense the signals encoded by this technique.
It is effectively demonstrated that the possibility of sensing such signals is associated with a suitable design of the signal constellation used in the modulation of the coded symbols. The constellation design of these is performed via genetic algorithms using a multiobjective optimization approach. The developed system is evaluated according to the robustness to time-varying flat fading through a bit error probability (BER) versus $E_b/N_0$ analysis. The spectral sensing ability is also addressed employing the cyclostationary analysis. The results denote the feasibility of using wavelet coding in radio scenarios with dynamic spectrum access, with good performance in terms of BER and signal detection rates.},
  author    = {{Valério de Souza}, Pedro Thiago and {Valério de Souza}, Vinícius Samuel and Silveira, Luiz Felipe de Queiroz},
  doi       = {10.1155/2020/9863785},
  editor    = {López-Benítez, Miguel},
  issn      = {1530-8669},
  journal   = {Wireless Communications and Mobile Computing},
  pages     = {9863785},
  publisher = {Hindawi},
  title     = {Design of Wavelet-Encoded Symbol Constellations for Cyclostationary Spectrum Sensing},
  url       = {https://doi.org/10.1155/2020/9863785},
  volume    = {2020},
  year      = {2020},
}

@article{Silva_Santos_Jr_Silveira_2019,
  title   = {{NOMA}: Um Estudo Bibliométrico},
  url     = {https://periodicos.ufersa.edu.br/ecop/article/view/8851},
  journal = {Anais do Encontro de Computação do Oeste Potiguar ECOP/UFERSA},
  issn    = {2526-7574},
  author  = {Silva, Jessika Cristina da and Santos, Yuri Pedro Dos and de Sousa, Jr, Vicente A. and Silveira, Luiz F.},
  year    = {2019},
}

@inproceedings{Silva2019,
  abstract  = {Energy efficiency is a growing concern for modern computing, especially for HPC due to operational costs and the environmental impact, considering that processors have an important role in this energy consumption. In this work, we propose a methodology to find energy-optimal frequency and number of active cores to run single-node HPC applications using an application-agnostic power model of the architecture and an architecture-aware performance model of the application. We characterize the application performance using machine learning, specifically the 'Support Vector Regression' algorithm. Besides that, the power consumption is estimated by modeling CMOS dynamic and static power without knowledge of the application. So, The energy-optimal configuration is estimated by minimizing the product these two models outcomes, the power model and the performance model. Then, the final model can be used to find better frequency and number of cores to aim energy efficiency application execution. Results were obtained for four PARSEC applications and, with five different inputs shows that the proposed approach used substantially less energy when compared to the DVFS governor, in best cases and worst cases.},
  author    = {Silva, Vitor R. G. and Furtunato, Alex F. A. and Georgiou, Kyriakos and Sakuyama, Carlos A. V. and Eder, Kerstin and Xavier-de-Souza, Samuel},
  booktitle = {2019 International Conference on High Performance Computing and Simulation, HPCS 2019},
  doi       = {10.1109/HPCS48598.2019.9188110},
  isbn      = {9781728144849},
  keywords  = {Energy Efficient Software,Performance Modeling,Power Modeling},
  month     = jul,
  pages     = {448--454},
  publisher = {IEEE},
  title     = {Energy-Optimal Configurations for Single-Node {HPC} Applications},
  url       = {https://ieeexplore.ieee.org/document/9188110/},
  year      = {2019},
}

@article{Assis2019,
  author   = {Assis, Italo A. S. and Oliveira, Antonio D. S. and Barros, Tiago and Sardina, Idalmis M. and Bianchini, Calebe P. and Xavier-de-Souza, Samuel},
  doi      = {10.1109/ACCESS.2019.2939100},
  issn     = {2169-3536},
  journal  = {IEEE Access},
  keywords = {Distributed Memory,Load balancing,One-Sided Communication,Reverse Time Migration,Work-Stealing},
  pages    = {128419--128430},
  title    = {Distributed-Memory Load Balancing With Cyclic Token-Based Work-Stealing Applied to Reverse Time Migration},
  url      = {https://ieeexplore.ieee.org/document/8822671/},
  volume   = {7},
  year     = {2019},
}

@article{Camara2019,
  abstract  = {Cyclostationary analysis has several applications in communications, e.g., spectral sensing, signal parameter estimation, and modulation classification. Most of them consider the additive white Gaussian noise (AWGN) channel model, although wireless communication systems may also be subject to non-Gaussian interference and impulsive noise. In this context, the communication channel can be better modeled by heavy-tailed distributions, such as the non-Gaussian alpha-stable one. Some applications of the cyclostationary approach based on the spatial sign cyclic correlation function (SSCCF), fractional lower-order cyclic autocorrelation function (FLOCAF), and cyclic correntropy function (CCF) demonstrate that these are promising solutions for the analysis of signals in the presence of impulsive non-Gaussian noise.
However, the investigation of functions above applied to digital modulation recognition in impulsive environments, and the comparison among them are topics that did not adequately explore yet. This work demonstrates that SSCCF is a particular case of the FLOCAF. Besides, a detailed analysis of the use of the FLOCAF and CCF is presented to obtain cyclostationary descriptors for the recognition of digital modulations BPSK, QPSK, 8-QAM, 16-QAM, and 32-QAM. Automatic modulation classification (AMC) architectures, based on the functions mentioned above, are also proposed. Besides, another contribution showed is that both the FLOCAF and CCF allow the symbol rate parameter estimation. The performances of AMC architectures were evaluated in the scenario with modulated signals contaminated with additive non-Gaussian alpha-stable noise. The results demonstrate that both architectures can classify signals in different contamination scenarios. However, the architecture based on the CCF is more efficient than the FLOCAF-based one.},
  author    = {Câmara, Tales V. R. O. and Lima, Arthur D. L. and Lima, Bruno M. M. and Fontes, Aluisio I. R. and Martins, Allan De M. and Silveira, Luiz F. Q.},
  doi       = {10.1109/ACCESS.2019.2943300},
  issn      = {2169-3536},
  journal   = {IEEE Access},
  keywords  = {Additive non-Gaussian alpha-stable noise,Automatic modulation recognition,Correntropy,Cyclic correntropy function,Cyclostationary descriptors,Digital modulations,Fractional lower-order cyclic autocorrelation function,Impulsive noise,Spatial sign cyclic correlation function},
  pages     = {138512--138527},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  title     = {Automatic modulation classification architectures based on cyclostationary features in impulsive environments},
  volume    = {7},
  year      = {2019},
  url       = {https://www.doi.org/10.1109/ACCESS.2019.2943300},
}

% NOTE(review): CiriloDoNascimento2019 previously had volume "2019-Janua",
% a truncated export artifact; it was dropped. Page numbers are also missing.
@inproceedings{CiriloDoNascimento2019,
  abstract  = {The critical path delay and, as a consequence, the maximum operating frequency of a digital system are dependent on the supply voltage, so is its power consumption. Typically, voltage guard bands are added in order to improve reliability, at the expense of power efficiency. It has been shown that error detection and correction (EDAC) techniques can be used to mitigate the effects of the reduced safety margins. This Ph.D. project aims to develop a MPSoC capable of self regulate its operating voltage by monitoring the error rate reported by a EDAC system, virtually eliminating voltage safety margins. Literature review and preliminary experiments supports the viability of this approach, motivating further investigation.},
  author    = {{Cirilo Do Nascimento}, Diego V. and Georgiou, Kyriakos and Eder, Kerstin I. and Xavier-de-Souza, Samuel},
  booktitle = {IEEE/IFIP International Conference on VLSI and System-on-Chip, VLSI-SoC},
  doi       = {10.1109/VLSI-SoC46951.2019.9047904},
  url       = {https://www.doi.org/10.1109/VLSI-SoC46951.2019.9047904},
  issn      = {2324-8440},
  keywords  = {Computer architecture,Energy efficiency,Guardband,Undervolting},
  publisher = {IEEE Computer Society},
  title     = {Exploiting guard band limits for energy gains in {MPSoCs}},
  year      = {2019},
}

@article{Costa2019,
  abstract  = {The acquisition is the most time-consuming step performed by a Global Navigation Satellite System (GNSS) receiver. The objective is to detect which satellites are transmitting and what are the phase and Doppler frequency shift of the signal. It is the step with the highest computational complexity, especially for signals subjected to large Doppler shifts. Improving acquisition performance has a large impact on the overall performance of the GNSS reception. In this paper, we present a two-step Global Positioning System (GPS) acquisition algorithm whose first step performs an incremental correlation to find a coarse pair of phase and frequency and the second step, triggered by the variance of the largest correlation values, refines the first step. The proposed strategy, based on the conventional time-domain serial algorithm, reduces the average execution time of the acquisition process to about 1/5 of the conventional acquisition while keeping the same modest logic hardware requirements and slightly better success and false-positive rates. Additionally, the new method reduces memory usage by a factor that is proportional to the signal's sampling frequency.
All these advantages over conventional acquisition contribute together to significantly improve the overall performance and cost of GPS receivers.},
  author    = {Costa, Fabrício and Albuquerque, Glauberto Leilson and Silveira, Luiz Felipe and Valderrama, Carlos and Xavier-de-Souza, Samuel},
  doi       = {10.3390/s19143177},
  issn      = {1424-8220},
  journal   = {Sensors},
  keywords  = {GPS acquisition,Two-step acquisition,Variance-based detection threshold},
  month     = jul,
  number    = {14},
  pages     = {3177},
  publisher = {MDPI AG},
  title     = {Variance-Triggered Two-Step {GPS} Acquisition},
  url       = {https://www.mdpi.com/1424-8220/19/14/3177},
  volume    = {19},
  year      = {2019},
}

% NOTE(review): Coutinho2019 previously had volume "2019-Octob", a truncated
% export artifact; it was dropped.
@inproceedings{Coutinho2019,
  abstract  = {This work proposes a novel methodology to predict the optimal performance and energy efficiency trade-off configurations of parallel applications running on a two-cluster Heterogeneous Multi-Processing (HMP) system. we propose an analytic performance and power model that are generated offline using data measurements. These models are then used to estimate the whole configuration space to predict the application's performance and energy consumption. Then, we use these off-line predictions to choose Pareto-optimal configurations, which is the most efficient among all configurations for the given architecture and multi-threaded application. We validated our methodology on an ODROID XU3 board on several PARSEC and Phoronix Test Suite applications.},
  author    = {Coutinho, Demetrios A. M. and Georgiou, Kyriakos and Eder, Kerstin I. and Nunez-Yanez, Jose and Xavier-de-Souza, Samuel},
  booktitle = {IEEE/IFIP International Conference on VLSI and System-on-Chip, VLSI-SoC},
  doi       = {10.1109/VLSI-SoC.2019.8920384},
  url       = {https://www.doi.org/10.1109/VLSI-SoC.2019.8920384},
  isbn      = {9781728139159},
  issn      = {2324-8440},
  keywords  = {Energy and Performance trade-offs,Energy modeling,Heterogeneous Multi-Processing,Pareto Frontier,Performance modeling},
  month     = oct,
  pages     = {232--233},
  publisher = {IEEE Computer Society},
  title     = {Performance and Energy Efficiency Trade-Offs in Single-{ISA} Heterogeneous Multi-Processing for Parallel Applications},
  year      = {2019},
}

% NOTE(review): in DaSilva2019 the fourth author was exported as
% "Alex, Alex F."; it is restored here as Furtunato, matching the co-authored
% entries in this file - confirm against the publisher record. The booktitle
% field holds the series name; confirm the actual proceedings title.
@inproceedings{DaSilva2019,
  abstract  = {Taking advantage of the growing number of cores in supercomputers to increase the scalability of parallel programs is an increasing challenge. Many advanced profiling tools have been developed to assist programmers in the process of analyzing data related to the execution of their program. Programmers can act upon the information generated by these data and make their programs reach higher performance levels. However, the information provided by profiling tools is generally designed to optimize the program for a specific execution environment, with a target number of cores and a target problem size. A code optimization driven towards scalability rather than specific performance requires the analysis of many distinct execution environments instead of details about a single environment. With the goal of providing more useful information for the analysis and optimization of code for parallel scalability, this work introduces the PaScal Viewer tool. It presents an novel and productive way to visualize scalability trends of parallel programs. It consists of four diagrams that offers visual support to identify parallel efficiency trends of the whole program, or parts of it, when running on scaling parallel environments with scaling problem sizes.},
  author    = {da Silva, Anderson B. N. and Cunha, Daniel A. M. and Silva, Vitor R. G. and Furtunato, Alex F. A. and Xavier-de-Souza, Samuel},
  booktitle = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  doi       = {10.1007/978-3-030-17872-7_15},
  isbn      = {9783030178710},
  issn      = {1611-3349},
  keywords  = {Efficiency,Parallel programming,Performance optimization,Scalability,Visualization tool},
  month     = nov,
  pages     = {250--264},
  publisher = {Springer Verlag},
  title     = {{PaScal Viewer}: A Tool for the Visualization of Parallel Scalability Trends},
  url       = {https://link.springer.com/chapter/10.1007/978-3-030-17872-7_15},
  volume    = {11027},
  year      = {2019},
}

@article{DeSouza2019,
  abstract  = {In cellular systems, information signals must be transmitted at high rates and with high reliability. One of the possible solutions to meet such criteria is the use of systems with multiple transmitting and/or receiving antenna arranged in the form of a multiple-input, multiple-output (MIMO) system. However, signal processing techniques in MIMO systems are developed under the assumption of transmission on Gaussian channels, which may lead to the decrease of efficiency in non-Gaussian communication scenarios. In this context, the widespread use of MIMO systems in recent years has motivated the development of new processing techniques that can be employed in scenarios that also consider the presence of non-Gaussian noise in communication channels. This work proposes a novel signal detection technique for MIMO systems, which is called maximum correntropy detector (MCD), being adequate to environments characterized by Gaussian and non-Gaussian noise. The introduced approach is based on complex correntropy function and can be seen as a generalization of the maximum likelihood detector (MLD) concept.
The MCD is evaluated on Gaussian and non-Gaussian channels, where superior performance is achieved when compared with the classic detectors, without significant increase of the computational complexity.}, author = {{De Souza}, Pedro T.V. and Fontes, Aluisio I.R. and {De Souza}, Vinicius S.V. and Silveira, Luiz F.}, doi = {10.1109/ACCESS.2019.2942822}, url = {https://www.doi.org/10.1109/ACCESS.2019.2942822}, issn = {21693536}, journal = {IEEE Access}, keywords = {Complex correntropy,maximum correntropy detector,multiple-input multiple-output systems,non-Gaussian noise,signal detectors}, pages = {137517--137527}, publisher = {Institute of Electrical and Electronics Engineers Inc.}, title = {{A Novel Signal Detector in MIMO Systems Based on Complex Correntropy}}, volume = {7}, year = {2019} } @inproceedings{DeSouza2019a, abstract = {In this work we present ContainEnergy, a new performance evaluation and profiling tool that uses software containers to perform application runtime assessment, providing energy and performance profiling data. 
It is focused on energy efficiency for next generation workloads and IT infrastructure.}, author = {{De Souza}, Wellington Silva and Iranfar, Arman and Silva, Anderson and Zapater, Marina and {De Souza}, Samuel Xavier and Olcoz, Katzalin and Atienza, David}, booktitle = {IEEE/IFIP International Conference on VLSI and System-on-Chip, VLSI-SoC}, doi = {10.1109/VLSI-SoC.2019.8920379}, url = {https://www.doi.org/10.1109/VLSI-SoC.2019.8920379}, isbn = {9781728139159}, issn = {23248440}, keywords = {DVFS,energy profiling,performance counters,performance profiling,software containers}, month = {oct}, pages = {230--231}, publisher = {IEEE Computer Society}, title = {{A QoS and Container-Based Approach for Energy Saving and Performance Profiling in Multi-Core Servers}}, volume = {2019-October}, year = {2019} } @inproceedings{Iranfar2019, abstract = {Accurate workload prediction and throughput estimation are keys in efficient proactive power and performance management of multi-core platforms. Although hardware performance counters available on modern platforms contain important information about the application behavior, employing them efficiently is not straightforward when dealing with time-varying applications even if they have iterative structures. In this work, we propose a machine learning-based framework for workload prediction and throughput estimation using hardware events. Our framework enables throughput estimation over various available system configurations, namely, number of parallel threads and operating frequency. In particular, we first employ workload clustering and classification techniques along with Markov chains to predict the next workload for each available system configuration. Then, the predicted workload is used to estimate the next expected throughput through a machine learning-based regression model.
The comparison with state of the art demonstrates that our framework is able to improve Quality of Service (QoS) by 3.4x, while consuming 15\% less power thanks to the more accurate throughput estimation.}, author = {Iranfar, Arman and {De Souza}, Wellington Silva and Zapater, Marina and Olcoz, Katzalin and {De Souza}, Samuel Xavier and Atienza, David}, booktitle = {IEEE/IFIP International Conference on VLSI and System-on-Chip, VLSI-SoC}, doi = {10.1109/VLSI-SoC.2019.8920309}, url = {https://www.doi.org/10.1109/VLSI-SoC.2019.8920309}, isbn = {9781728139159}, issn = {23248440}, month = {oct}, pages = {211--216}, publisher = {IEEE Computer Society}, title = {{A Machine Learning-Based Framework for Throughput Estimation of Time-Varying Applications in Multi-Core Servers}}, volume = {2019-October}, year = {2019} } @article{LimaFilho2019, abstract = {Users and Internet service providers (ISPs) are constantly affected by denial-of-service (DoS) attacks. This cyber threat continues to grow even with the development of new protection technologies. Developing mechanisms to detect this threat is a current challenge in network security. This article presents a machine learning- (ML-) based DoS detection system. The proposed approach makes inferences based on signatures previously extracted from samples of network traffic. The experiments were performed using four modern benchmark datasets.
The results show an online detection rate (DR) of attacks above 96\%, with high precision (PREC) and low false alarm rate (FAR) using a sampling rate (SR) of 20\% of network traffic.}, author = {de {Lima Filho}, Francisco Sales and Silveira, Frederico A F and {de Medeiros Brito Junior}, Agostinho and Vargas-Solar, Genoveva and Silveira, Luiz F}, doi = {10.1155/2019/1574749}, editor = {Maglaras, Leandros}, issn = {1939-0114}, journal = {Security and Communication Networks}, pages = {1574749}, publisher = {Hindawi}, title = {{Smart Detection: An Online Approach for DoS/DDoS Attack Detection Using Machine Learning}}, url = {https://doi.org/10.1155/2019/1574749}, volume = {2019}, year = {2019} } @inproceedings{Oliveira2019, abstract = {This paper presents a proposal for energy optimization on Software-Defined Network (SDN) by a proper controller placement. First, the discussion shows the definition of SDN and the role of controllers, then the current state-of-the-art on distributed SDN controllers is briefly discussed showing that current research on this topic focuses on fault-tolerance and load-balancing. Then the energy saving SDN strategies are presented and the problem of saving energy on the control-plane is given further details. A new approach based on parallelism and lower processor frequencies is demonstrated finally, the expected results and key contributions are defined.}, author = {Oliveira, Tadeu F.
and Silveira, Luiz Felipe Q.}, booktitle = {2019 4th International Conference on Fog and Mobile Edge Computing, FMEC 2019}, doi = {10.1109/FMEC.2019.8795343}, url = {https://www.doi.org/10.1109/FMEC.2019.8795343}, isbn = {9781728117966}, keywords = {SDN,controller placement,energy savings,software-defined-network}, month = {jun}, pages = {86--89}, publisher = {Institute of Electrical and Electronics Engineers Inc.}, title = {{Distributed SDN controllers optimization for energy saving}}, year = {2019} } @inproceedings{Ramos2019, abstract = {The analysis of application performance is essential to better exploit its potential on High-Performance Computing (HPC) architectures. Access to performance counters, available in modern processors, allows collecting key information about program behavior to provide the most appropriate HPC execution strategy. In this context, we have developed an accurate tool based on performance counters, which facilitates modeling, fingerprinting, behavior comparison and clustering of applications. It provides a high-level Python API for accessing and configuring performance counters. While the execution and counters gathering is performed by a C++ module to reduce overheads. Moreover, the accuracy of this multiplatform tool was also compared to existing alternatives. Key features, such as performance counters collection, post-processing, and comparison, enable fingerprinting of applications, an important step in understanding program behavior for later classification and optimization according to the parameters characterizing the target HPC platform. For demonstration purposes, the tool was used in the clustering of Polybench applications, a frequently used benchmark set for kernels monitoring.
This clustering helped the identification of applications with similar and comparable behaviors in terms of input size, data accesses and movements, resource utilization, and computation, which facilitates the creation of test sets for a given environment, according to specific measurement parameters.}, author = {Ramos, Vitor and Valderrama, Carlos and {Xavier De Souza}, Samuel and Manneback, Pierre}, booktitle = {Proceedings - 2019 IEEE 33rd International Parallel and Distributed Processing Symposium Workshops, IPDPSW 2019}, doi = {10.1109/IPDPSW.2019.00130}, url = {https://www.doi.org/10.1109/IPDPSW.2019.00130}, isbn = {9781728135106}, keywords = {Clustering,Fingerprinting,Modeling,Parallel Applications,Performance Counters}, month = {may}, pages = {797--804}, publisher = {Institute of Electrical and Electronics Engineers Inc.}, title = {{An accurate tool for modeling, fingerprinting, comparison, and clustering of parallel applications based on performance counters}}, year = {2019} } @inproceedings{Santana2019, abstract = {Full waveform inversion has gained attention in the geophysics community as an efficient technique for the determination of seismic subsurface velocity models. However, the full waveform inversion technique is computationally intensive, both in terms of execution time and memory usage. In order to obtain shorter execution times, usually the full waveform inversion algorithm is implemented using the concept of parallel programming. For the implementation in distributed memory environments, it is important to define the tasks (processes) distribution among the computational nodes, which is known as workload scheduling. The workload scheduling approach directly impacts on computationally intensive algorithms, such as the seismic wave propagation, highly employed in full waveform inversion. For a large number of nodes and tasks, the full waveform inversion might suffer of scalability issues.
In this work we compare two workload scheduling approaches for a parallel 2D acoustic full waveform inversion implementation running in a distributed memory system: the centralized dynamic and the decentralized static. The comparison is made by presenting speedup and efficiency plots for different model sizes and number of nodes. The scalability and performance analysis showed that the decentralized static algorithm is highly scalable and efficient in distributed memory systems.}, author = {Santana, Carla and Barros, Tiago and Milian, Idalmis and Bianchini, Calebe and Xavier-de-Souza, Samuel}, booktitle = {Proceedings of the 16th International Congress of the Brazilian Geophysical Society{\&}Expogef}, doi = {10.22564/16cisbgf2019.223}, pages = {1--5}, publisher = {Brazilian Geophysical Society}, title = {{Workload scheduling comparison in a full waveform inversion distributed memory implementation}}, url = {{https://sbgf.org.br/mysbgf/eventos/expanded_abstracts/16th_CISBGf/session/MACHINE LEARNING AND ARTIFICIAL INTELLIGENCE/Workload scheduling comparison in a full waveform inversion distributed memory implementation.pdf}}, year = {2019} } @techreport{Silva2019, abstract = {Neste trabalho é realizado um estudo bibliométrico para levantamento de tendências tecnológicas do NOMA (Non-Orthogonal Multiple Access). Esse levantamento é importante para pesquisadores que estejam cogitando investir esforços na tecnologia NOMA e precisem mapear seu estágio de desenvolvimento. As bases de publicações científicas Web of Science e Scopus foram utilizadas com a finalidade de identificar as áreas de aplicação e técnicas relacionadas ao NOMA bem como inferir a maturidade tecnológica de cada uma delas. Os dados coletados mostram uma evolução exponencial no número de publicações envolvendo NOMA, com um grande destaque para aquelas vinculadas aos sistemas 5G.}, author = {da Silva, Jessika Cristina and Santos, Yuri Pedro Dos and Jr, Vicente A.
de Sousa and Silveira, Luiz F.}, booktitle = {Anais do Encontro de Computação do Oeste Potiguar ECOP/UFERSA (ISSN 2526-7574)}, issn = {2526-7574}, month = {aug}, number = {3}, title = {{NOMA: Um Estudo Bibliométrico}}, url = {https://periodicos.ufersa.edu.br/index.php/ecop/article/view/8851}, year = {2019} } @inproceedings{silva2019, address = {Dublin}, author = {Silva, Vitor R G and Furtunato, Alex F A and Georgiou, Kyriakos and Valderrama, Carlos and Eder, Kerstin and Xavier-de-Souza, S}, booktitle = {Proceedings of the 17th International Conference on High Performance Computing \& Simulation}, title = {{Energy-Optimal Configurations for Single-Node HPC Applications}}, url = {https://arxiv.org/abs/1805.00998}, year = {2019} } @inproceedings{silveira2019a, address = {Petrolina}, author = {SILVEIRA, F A F and {LIMA FILHO}, F S and {BRITO JUNIOR}, A M and Silveira, Luiz F}, booktitle = {Anais da Conferência Nacional em Comunicações, Redes e Segurança da Informação}, title = {{Sensor IoT para Detecção de DDoS}}, year = {2019} } @inproceedings{souza2019c, address = {Petrolina}, author = {Souza, P T V and SOUZA, V S V and Silveira, Luiz F}, booktitle = {Anais da Conferência Nacional em Comunicações, Redes e Segurança da Informação}, title = {{Projeto de Constelações Adequadas ao Sensoriamento Espectral por Cicloestacionariedades}}, year = {2019} } @inproceedings{souza2019b, address = {Petrolina}, author = {Souza, P T V and SOUZA, V S V and Silveira, Luiz F}, booktitle = {Anais da Conferência Nacional em Comunicações, Redes e Segurança da Informação}, title = {{Arquitetura de Sensoriamento Espectral Utilizando um Comitê de Detectores de Cicloestacionariedades}}, year = {2019} } @article{Souza2019, abstract = {This work presents a novel spectral sensing method for the detection of signals presenting nonlinear phase variation over time.
The introduced method is based on the angle-time cyclostationarity theory, which applies transformations to the signal to be sensed in order to mitigate the effects of nonlinear phase variation. The architecture is employed for sensing binary phase shift keying (BPSK) signals, being also compared with time cyclostationarity. The obtained simulation results clearly demonstrate the efficiency of the proposed approach, while presenting improved performance in terms of the detection rate of primary users increased by about 8 dB.}, author = {Souza, Pedro and Souza, Vinicius and Silveira, Luiz F.}, doi = {10.3390/s19194222}, issn = {1424-8220}, journal = {Sensors}, keywords = {Angle-time cyclostationarity,Cognitive radio,Cyclostationarity,Dynamic spectrum access,Spectral sensing}, month = {sep}, number = {19}, pages = {4222}, publisher = {MDPI AG}, title = {{Analysis of Spectral Sensing Using Angle-Time Cyclostationarity}}, url = {https://www.mdpi.com/1424-8220/19/19/4222}, volume = {19}, year = {2019} } @article{AndreNeves2018, abstract = {This article presents the analysis and comparison of two powerful tools to explore design space and study multi-core microprocessors. Heracles, developed at the MIT, is a modular tool to create MIPS multi-core processors. Its modularity allows quick development by varying the types of processor, memory, network interconnect and cache. RISC-V is a new instruction set architecture, developed at the University of California, Berkeley, that has several tools for designing architectures and processors that use this instruction set. The Rocket Chip Generator is one of these tools. It is the equivalent of Heracles for the MIPS architecture and, as such, provide several features that allows rapid development of RISC-V multi-core processors. We compared the target hardware and software features of these tools.
The Rocket Chip Generator proved to be an excellent tool for the development of new RISC-V processors whereas Heracles seemed a more adequate tool for teaching and parallel architecture research at higher levels of abstraction.}, author = {{André Neves}, Eduardo and Xavier-de-Souza, Samuel}, doi = {10.17706/jcp.13.5.555-563}, url = {https://www.doi.org/10.17706/jcp.13.5.555-563}, issn = {1796203X}, journal = {Journal of Computers}, pages = {555--563}, publisher = {International Academy Publishing (IAP)}, title = {{Exploring Multi-core Design Space: Heracles vs. Rocket Chip Generator}}, year = {2018} } @inproceedings{Barros2018, address = {Santander}, author = {Barros, T. and Fernandes, J. B. and Souza-de-Assis, I. A. and {Xavier de Souza}, S.}, booktitle = {First EAGE Workshop on High Performance Computing for Upstream in Latin America}, doi = {10.3997/2214-4609.201803072}, keywords = {Barros2018}, month = {sep}, publisher = {EarthDoc}, title = {{Auto-Tuning of 3D Acoustic Wave Propagation in Shared Memory Environments}}, url = {http://www.earthdoc.org/publication/publicationdetails/?publication=94579}, year = {2018} } @article{Cosme2018, abstract = {The inversion of extremely high order matrices has been a challenging task because of the limited processing and memory capacity of conventional computers. In a scenario in which the data does not fit in memory, it is worth to consider exchanging less memory usage for more processing time in order to enable the computation of the inverse which otherwise would be prohibitive. We propose a new algorithm to compute the inverse of block partitioned matrices with a reduced memory footprint. The algorithm works recursively to invert one block of a k × k block matrix M, with k ≥ 2, based on the successive splitting of M. It computes one block of the inverse at a time, in order to limit memory usage during the entire processing.
Experimental results show that, despite increasing computational complexity, matrices that otherwise would exceed the memory-usage limit can be inverted using this technique.}, author = {Cosme, Iria C.S. and Fernandes, Isaac F. and de Carvalho, João L. and Xavier-de-Souza, Samuel}, doi = {10.1016/j.amc.2018.01.051}, url = {https://www.doi.org/10.1016/j.amc.2018.01.051}, issn = {00963003}, journal = {Applied Mathematics and Computation}, keywords = {Block matrices,Large matrices,Low memory usage,Recursive matrix inversion,Schur complement}, month = {jul}, pages = {125--136}, publisher = {Elsevier Inc.}, title = {{Memory-usage advantageous block recursive matrix inverse}}, volume = {328}, year = {2018} } @inproceedings{araujo2018, address = {Rio de Janeiro}, author = {de Araújo, João Medeiros and do Nascimento, Hugo Alexandre Dantas and Jradi, Walid Abdala Rfaei and BARROS, T and Xavier-de-Souza, Samuel and LUCENA, L S}, booktitle = {Anais do Rio Oil \& Gas}, title = {{Estratégias de Otimização de Código para Propagação de Onda em FWI}}, year = {2018} } @inproceedings{Fernandes2018, address = {Rio de Janeiro}, author = {Fernandes, João B. and Souza-de-Assis, Ítalo A.
and Barros, Tiago and Xavier-de-Souza, Samuel}, booktitle = {Rio Oil & Gas}, keywords = {Fernandes2018}, title = {{Automatic Scheduler for 3D Seismic Modeling by Finite Differences}}, url = {https://stt.ibp.org.br/eventos/2018/riooil2018/pdfs/Riooil2018_1901_201806151345riooeg_end_paper.pdf}, year = {2018} } @book{gama2018, author = {GAMA, F O S and SILVEIRA, LUIZ F Q and SALAZAR, A O}, edition = {first}, publisher = {Editorial Académica Española}, title = {{Perspectiva de redes de sensores inalámbricos en un sistema de control}}, url = {https://www.amazon.com/Perspectiva-sensores-inalámbricos-sistema-control/dp/6202123346}, year = {2018} } @inproceedings{Georgiou2018, abstract = {This paper presents the interesting observation that by performing fewer of the optimizations available in a standard compiler optimization level such as -O2, while preserving their original ordering, significant savings can be achieved in both execution time and energy consumption. This observation has been validated on two embedded processors, namely the ARM Cortex-M0 and the ARM Cortex-M3, using two different versions of the LLVM compilation framework; v3.8 and v5.0. Experimental evaluation with 71 embedded benchmarks demonstrated performance gains for at least half of the benchmarks for both processors. An average execution time reduction of 2.4% and 5.3% was achieved across all the benchmarks for the Cortex-M0 and Cortex-M3 processors, respectively, with execution time improvements ranging from 1% up to 90% over the -O2. The savings that can be achieved are in the same range as what can be achieved by the state-of-the-art compilation approaches that use iterative compilation or machine learning to select flags or to determine phase orderings that result in more efficient code. In contrast to these time consuming and expensive to apply techniques, our approach only needs to test a limited number of optimization configurations, less than 64, to obtain similar or even better savings. 
Furthermore, our approach can support multi-criteria optimization as it targets execution time, energy consumption and code size at the same time.}, address = {New York, New York, USA}, archivePrefix = {arXiv}, arxivId = {1802.09845}, author = {Georgiou, Kyriakos and Blackmore, Craig and Xavier-de-Souza, Samuel and Eder, Kerstin}, booktitle = {Proceedings of the 21st International Workshop on Software and Compilers for Embedded Systems, SCOPES 2018}, doi = {10.1145/3207719.3207727}, eprint = {1802.09845}, isbn = {9781450357807}, keywords = {Autotuning,Compiler optimizations,Embedded systems,Energy consumption,Execution time,Phase-ordering}, month = {may}, pages = {35--42}, publisher = {Association for Computing Machinery, Inc}, title = {{Less is more: Exploiting the standard compiler optimization levels for better performance and energy consumption}}, url = {http://dl.acm.org/citation.cfm?doid=3207719.3207727}, year = {2018} } @misc{Georgiou2018a, abstract = {The Internet of Things (IoT) sparks a whole new world of embedded applications. Most of these applications are based on deeply embedded systems that have to operate on limited or unreliable sources of energy, such as batteries or energy harvesters. Meeting the energy requirements for such applications is a hard challenge, which threatens the future growth of the IoT. Software has the ultimate control over hardware. Therefore, its role is significant in optimizing the energy consumption of a system. Currently, programmers have no feedback on how their software affects the energy consumption of a system. Such feedback can be enabled by energy transparency, a concept that makes a program's energy consumption visible, from hardware to software. 
This letter discusses the need for energy transparency in software development and emphasizes on how such transparency can be realized to help tackle the IoT energy challenge.}, archivePrefix = {arXiv}, arxivId = {1706.08817}, author = {Georgiou, Kyriakos and Xavier-De-Souza, Samuel and Eder, Kerstin}, booktitle = {IEEE Embedded Systems Letters}, doi = {10.1109/LES.2017.2741419}, url = {https://www.doi.org/10.1109/LES.2017.2741419}, eprint = {1706.08817}, issn = {19430663}, keywords = {Energy efficiency,Internet of Things (IoT),software metrics}, month = {sep}, number = {3}, pages = {53--56}, publisher = {Institute of Electrical and Electronics Engineers Inc.}, title = {{The IoT Energy Challenge: A Software Perspective}}, volume = {10}, year = {2018} } @article{Goncalves-e-Silva2018, abstract = {We propose a parallel synchronous and asynchronous implementation of the coupled simulated annealing (CSA) algorithm in a shared-memory architecture. The original CSA was implemented synchronously in a distributed-memory architecture. It synchronizes at each temperature update, which leads to idling and loss of efficiency when increasing the number of processors. The proposed synchronous CSA (SCSA) is implemented as the original, but in a shared-memory architecture. The proposed asynchronous CSA (ACSA) does not synchronize, allowing a larger parallel efficiency for larger numbers of processors. Results from extensive experiments show that the proposed ACSA presents much better quality of solution when compared to the serial and to the SCSA. The experiments also show that the performance of the proposed ACSA is better than the SCSA for less computationally intensive problems or when a larger number of processing cores are available. Moreover, the parallel efficiency of the ACSA improves by increasing the size of the problem. 
With the advent of the Multi-core Era, the use of the proposed algorithm becomes more attractive than the original synchronous CSA.}, author = {Gonçalves-e-Silva, Kayo and Aloise, Daniel and Xavier-de-Souza, Samuel}, doi = {10.1007/s11227-018-2327-4}, issn = {15730484}, journal = {Journal of Supercomputing}, keywords = {Coupled simulated annealing,Global optimization,Parallel algorithms,Parallel efficiency}, month = {jun}, number = {6}, pages = {2841--2869}, publisher = {Springer New York LLC}, title = {{Parallel synchronous and asynchronous coupled simulated annealing}}, url = {https://link.springer.com/article/10.1007/s11227-018-2327-4}, volume = {74}, year = {2018} } @article{Goncalves-E-Silva2018, abstract = {Nelder-Mead method (NM) for solving continuous non-linear optimization problem is probably the most cited and the most used method in the optimization literature and in practical applications, too. It belongs to the direct search methods, those which do not use the first and the second order derivatives. The popularity of NM is based on its simplicity. In this paper we propose even more simple algorithm for larger instances that follows NM idea. We call it Simplified NM (SNM): instead of generating all n + 1 simplex points in Rn, we perform search using just q + 1 vertices, where q is usually much smaller than n. Though the results cannot be better than after performing calculations in n+1 points as in NM, significant speed-up allows to run many times SNM from different starting solutions, usually getting better results than those obtained by NM within the same cpu time. Computational analysis is performed on 10 classical convex and non-convex instances, where the number of variables n can be arbitrarily large. 
The obtained results show that SNM is more effective than the original NM, confirming that LIMA yields good results when solving a continuous optimization problem.}, author = {Gonçalves-E-Silva, Kayo and Aloise, Daniel and Xavier-De-Souza, Samuel and Mladenovic, Nenad}, doi = {10.2298/YJOR180120014G}, url = {https://www.doi.org/10.2298/YJOR180120014G}, issn = {23346043}, journal = {Yugoslav Journal of Operations Research}, keywords = {Continuous optimization,Direct search methods,Less is more approach,Nelder mead method}, month = {jun}, number = {2}, pages = {153--169}, publisher = {Faculty of Organizational Sciences, Belgrade}, title = {{Less is more: Simplified nelder-mead method for large unconstrained optimization}}, volume = {28}, year = {2018} } @article{Lima2018, abstract = {The current static management policy for spectrum allocation has shown to be inefficient when dealing with the increasing demand for wireless communication systems. More recently, opportunistic spectrum access has emerged as a promising alternative that allows non-licensed users to utilize the spectrum if no primary users are detected. Spectrum sensing based on cyclostationary feature detection can be employed to reliably identify the presence of primary users even at low SNR levels. However, the detection of modulated signals at lower SNR levels demands a higher number of analyzed samples. In this paper, we propose an architecture for spectrum sensing that enables the reduction of the computational time needed to obtain cyclostationary features of a signal when using multi-core processors. Simulation results show that the proposed architecture can achieve over 92.8% parallel efficiency, which leads to a reduction of spectrum sensing time by a factor of 29.7.}, author = {Lima, Arthur D.L. and Silveira, Luiz F.Q. 
and Xavier-de-Souza, Samuel}, doi = {10.1016/j.compeleceng.2018.07.016}, url = {https://www.doi.org/10.1016/j.compeleceng.2018.07.016}, issn = {00457906}, journal = {Computers and Electrical Engineering}, keywords = {Cognitive radio,Cyclic correlation,Cyclic detector,Cyclic feature detection,Parallel computing,Receiver sensitivity model}, month = {oct}, pages = {151--161}, publisher = {Elsevier Ltd}, title = {{Spectrum sensing with a parallel algorithm for cyclostationary feature extraction}}, volume = {71}, year = {2018} } @inproceedings{nunes2018, address = {João Pessoa}, author = {NUNES, E A F and SILVEIRA, LUIZ F Q and ALVES, D K and DANTAS, E S and PESSOA, G A P C A}, booktitle = {Anais do Congresso Brasileiro de Automática}, title = {{AVALIAÇÃO DO IMPACTO HARMÔNICO DE CORRENTE DEVIDO À INSERÇÃO DE SISTEMAS FOTOVOLTAICOS À REDE ELÉTRICA}}, year = {2018} } @inproceedings{Oliveira2018, abstract = {To make efficient use of multi-core processors, it is important to understand the performance behavior of parallel applications. Modeling this can enable the use of online approaches to optimize throughput or energy, or even guarantee a minimum QoS. Accurate models would avoid probe different runtime configurations, which causes overhead. Throughout the years, many speedup models were proposed. Most of them based on Amdahl's or Gustafson's laws. However, many of those make considerations such as a fixed parallel fraction, or a parallel fraction that varies linearly with problem size, and inexistent parallelization overhead. Although such models aid in the theoretical understanding, these considerations do not hold in real environments, which makes the modeling unsuitable for accurate characterization of parallel applications. The model proposed estimates the speedup taking into account the variation of its parallel fraction according to problem size, number of cores used and overhead . 
Using four applications from the PARSEC benchmark suite, the proposed model was able to estimate speedups more accurately than other models in recent literature.}, address = {New York, NY, USA}, author = {Oliveira, Victor H.F. and Georgiou, Kyriakos and Furtunato, Alex F.A. and Eder, Kerstin and Silveira, Luiz F. and Xavier-De-Souza, Samuel}, booktitle = {ICPE 2018 - Companion of the 2018 ACM/SPEC International Conference on Performance Engineering}, doi = {10.1145/3185768.3185770}, isbn = {9781450356299}, keywords = {Application Characterization,Parallel Computing,Performance Modeling}, month = {apr}, pages = {43--44}, publisher = {Association for Computing Machinery, Inc}, title = {{Application speedup characterization: Modeling parallelization overhead and variations of problem size and number of cores}}, url = {https://dl.acm.org/doi/10.1145/3185768.3185770}, volume = {2018-January}, year = {2018} } @inproceedings{santos2018, address = {Campina Grande}, author = {SANTOS, Y P and {LIMA FILHO}, F S and Fontes, A I R and Silveira, Luiz F Q}, booktitle = {Anais do XXXVI Simpósio Brasileiro de Telecomunicações e Processamento de Sinais}, title = {{Sistema de Detecção de Patologias Vocais Baseado no Domínio Espectral da Correntropia}}, year = {2018}, url = {https://repositorio.ufrn.br/handle/123456789/26829} } @inproceedings{Silva2018, abstract = {The Block Recursive Inversion (BRI) algorithm calculates the inversion of large k x k block matrices with limited memory during the entire processing because it calculates one block of the inverse at a time. However, the lower memory consumption is counterbalanced by higher computational complexity. We propose a parallel BRI implementation, which also calculates one block at a time, to reduce execution time and extend its applicability by exploiting modern multi-core architectures. The proposed parallel BRI was implemented for shared memory systems in OpenMP.
The results of a performance and scalability analysis for different use cases reveals opposite trends in execution time, with the proposed parallel implementation being faster for larger k. Although not weakly scalable for a fixed k, scalability tends to increase with the increase of k or, equivalently, with the reduction of memory requirements.}, author = {Silva, Maria Clara and Cosme, Iria C.S. and Sardina, Idalmis M. and Xavier-De-Souza, Samuel}, booktitle = {Proceedings - IEEE International Conference on Cluster Computing, ICCC}, doi = {10.1109/CLUSTER.2018.00029}, url = {https://www.doi.org/10.1109/CLUSTER.2018.00029}, isbn = {9781538683194}, issn = {15525244}, keywords = {Block Recursive Inversion,Large Matrices,Matrix Inversion,OpenMP}, month = {oct}, pages = {154--155}, publisher = {Institute of Electrical and Electronics Engineers Inc.}, title = {{Scalable Shared-Memory Parallelization of the Block Recursive Inversion Algorithm}}, volume = {2018-September}, year = {2018} } @inproceedings{Souza2018, author = {Souza, Pedro and Souza, Vinicius and Fontes, Aluísio and Silveira, Luiz}, booktitle = {Anais do XXXVI Simpósio Brasileiro de Telecomunicações e Processamento de Sinais}, doi = {10.14209/sbrt.2018.329}, publisher = {Sociedade Brasileira de Telecomunicações}, title = {{Projeto de constelações com símbolos não-equiprováveis adequadas ao sensoriamento espectral por características cicloestacionárias utilizando Simulated Annealing}}, url = {http://biblioteca.sbrt.org.br/articles/1793}, year = {2018} } @article{Aloise2017, abstract = {k-means is a benchmark algorithm used in cluster analysis. It belongs to the large category of heuristics based on location-allocation steps that alternately locate cluster centers and allocate data points to them until no further improvement is possible. Such heuristics are known to suffer from a phenomenon called degeneracy in which some of the clusters are empty.
In this paper, we compare and propose a series of strategies to circumvent degenerate solutions during a k-means execution. Our computational experiments show that these strategies are effective, leading to better clustering solutions in the vast majority of the cases in which degeneracy appears in k-means. Moreover, we compare the use of our fixing strategies within k-means against the use of two initialization methods found in the literature. These results demonstrate how useful the proposed strategies can be, specially inside memory-based clustering algorithms.}, author = {Aloise, Daniel and Damasceno, Nielsen Castelo and Mladenovic, Nenad and Pinheiro, Daniel Nobre}, doi = {10.1007/s00357-017-9231-0}, issn = {14321343}, journal = {Journal of Classification}, keywords = {Clustering,Degeneracy,Heuristics,Minimum sum-of-squares,k-means}, month = jul, number = {2}, pages = {165--190}, publisher = {Springer New York LLC}, title = {{On Strategies to Fix Degenerate k-means Solutions}}, url = {https://link.springer.com/article/10.1007/s00357-017-9231-0}, volume = {34}, year = {2017} } @article{Cavalcante2017, abstract = {Future generation mobile communications running on mm-wave frequencies will require great robustness against frequency selective channels. In this paper, we evaluate the transmission performance of 4.9 Gb/s wavelet-coded orthogonal frequency division multiplexing (OFDM) signals on a 10 km fiber plus 58 m wireless radio-over-fiber link using a mm-wave radio frequency carrier. The results show that a 2 × 128 wavelet-coded OFDM system achieves a bit-error rate of 1e-4 with nearly 2.5 dB less signal-to-noise ratio than a convolutional coded OFDM system with equivalent spectral efficiency for 8 GHz-wide signals with 512 subcarriers on a carrier frequency of 86 GHz.
Our findings confirm the Tzannes' theory that wavelet coding enables high diversity gains with a low complexity receiver and, most notably, without compromising the system's spectral efficiency.}, author = {Cavalcante, Lucas C. P. and Rommel, Simon and Dinis, Rui and {Silveira Junior}, L. G. Q. and Silveira, L. F. Q. and Monroy, Idelfonso Tafur}, doi = {10.1109/JLT.2017.2701358}, url = {https://www.doi.org/10.1109/JLT.2017.2701358}, issn = {07338724}, journal = {Journal of Lightwave Technology}, keywords = {Frequency selectivity,OFDM,W-band,mm-Wave,radio-over-fiber,wavelet-coding}, month = jul, number = {14}, pages = {2803--2809}, publisher = {Institute of Electrical and Electronics Engineers Inc.}, title = {{Performance evaluation of wavelet-coded OFDM on a 4.9 Gb/s W-Band Radio-Over-Fiber Link}}, volume = {35}, year = {2017} } @inproceedings{souza2017, address = {Cambridge, UK}, author = {de Souza, Samuel and Nikov, K and Nunez-Yanez, J and Eder, Kerstin}, booktitle = {Proceedings of Arm Research Summit}, title = {{The Energy Consumption Benefits of DynamIQ for Heterogeneous Parallel Workloads}}, url = {https://www.researchgate.net/publication/319914261_The_energy_consumption_benefits_of_DynamIQ_for_heterogeneous_parallel_workloads}, year = {2017} } @article{Fontes2017, abstract = {Information extraction is a frequent and relevant problem in digital signal processing. In the past few years, different methods have been utilized for the parameterization of signals and the achievement of efficient descriptors. When the signals possess statistical cyclostationary properties, the Cyclic Autocorrelation Function (CAF) and the Spectral Cyclic Density (SCD) can be used to extract second-order cyclostationary information. However, second-order statistics tightly depends on the assumption of gaussianity, as the cyclostationary analysis in this case should comprise higher-order statistical information.
This paper proposes a new mathematical formulation for the higher-order cyclostationary analysis based on the correntropy function. The cyclostationary analysis is revisited focusing on the information theory, while the Cyclic Correntropy Function (CCF) and Cyclic Correntropy Spectral Density (CCSD) are also presented. The CCF has different properties compared with CAF that can be very useful in non-gaussian signal processing, especially in the impulsive noise environment which implies in the expansion of the class of problems addressed by the second-order cyclostationary analysis. In particular, we prove that the CCF contains information regarding second- and higher-order cyclostationary moments, being a generalization of the CAF. The performance of the aforementioned functions in the extraction of higher-order cyclostationary characteristics is analyzed in a wireless communication system in which non-gaussian noise is present. The results demonstrate the advantages of the proposed method over the second-order cyclostationary.}, author = {Fontes, Aluisio I. R. and Rego, Joilson B. A. and Martins, Allan de M. and Silveira, Luiz F. Q. and Principe, J. C.}, doi = {10.1016/j.eswa.2016.10.029}, url = {https://www.doi.org/10.1016/j.eswa.2016.10.029}, issn = {09574174}, journal = {Expert Systems with Applications}, keywords = {Correntropy,Cyclic correntropy function,Cyclic correntropy spectral density,Cyclostationary,Information extraction}, month = mar, pages = {110--117}, publisher = {Elsevier Ltd}, title = {{Cyclostationary correntropy: Definition and applications}}, volume = {69}, year = {2017} } @article{Gama2017, abstract = {Wireless control systems can sense, control and act on the information exchanged between the wireless sensor nodes in a control loop. However, the exchanged information becomes susceptible to the degenerative effects produced by the multipath propagation.
In order to minimize the destructive effects characteristic of wireless channels, several techniques have been investigated recently. Among them, wavelet coding is a good alternative for wireless communications for its robustness to the effects of multipath and its low computational complexity. This work proposes an adaptive wavelet coding whose parameters of code rate and signal constellation can vary according to the fading level and evaluates the use of this transmission system in a control loop implemented by wireless sensor nodes. The performance of the adaptive system was evaluated in terms of bit error rate (BER) versus Eb/N0 and spectral efficiency, considering a time-varying channel with flat Rayleigh fading, and in terms of processing overhead on a control system with wireless communication. The results obtained through computational simulations and experimental tests show performance gains obtained by insertion of the adaptive wavelet coding in a control loop with nodes interconnected by wireless link. These results enable the use of this technique in a wireless link control loop.}, author = {Gama, Felipe and Silveira, Luiz and Salazar, Andrés}, doi = {10.3390/s17122901}, issn = {1424-8220}, journal = {Sensors}, keywords = {Control loop,Rayleigh fading,Time diversity,Wavelet coding,Wireless communications}, month = dec, number = {12}, pages = {2901}, publisher = {MDPI AG}, title = {{Adaptive Wavelet Coding Applied in a Wireless Control System}}, url = {http://www.mdpi.com/1424-8220/17/12/2901}, volume = {17}, year = {2017} } @inproceedings{Ichihara2017, abstract = {In this paper, a stochastic algorithm called Coupled Simulated Annealing (CSA) is used to develop a Nonlinear Model Predictive Control (NMPC) strategy that can deal with model parameter uncertainties. The adopted approach consists in formulating the NMPC as an optimization problem and using CSA to search for the solution.
The computation of the control input is performed in two steps: first, based on past states and inputs data, CSA is used to minimize the states prediction error over the set of model parameters. The model is then updated and CSA is used to minimize a cost function over the predicted states and inputs. Simulation results show the effectiveness of the proposed controller for a model of highly nonlinear reactor with parametric uncertainties.}, author = {Ichihara, Danilo C S and Dórea, Carlos E T and Xavier-De-Souza, Samuel}, booktitle = {Anais do XIII Simpósio Brasileiro de Automação Inteligente}, keywords = {Adaptive strategy,Coupled simulated annealing (CSA),Nonlinear model predictive control (NMPC),Processes Control}, title = {{Nonlinear Model Predictive Control with Adaptive Strategy Using Coupled Simulated Annealing}}, url = {https://pdfs.semanticscholar.org/037f/5584af953ec73770248ef0163792cac30aed.pdf}, year = {2017} } @article{Pereira2017, abstract = {We propose an approach for the synchronization of video streams using correntropy. Essentially, the time offset is calculated on the basis of the instantaneous transfer rates of the video streams that are extracted in the form of a univariate signal known as variable bit-rate (VBR). The state-of-the-art approach uses a window segmentation strategy that is based on consensual zero-mean normalized cross-correlation (ZNCC). This strategy has an elevated computational complexity, making its application to synchronizing online data streaming difficult. Hence, our proposal uses a different window strategy that, together with the correntropy function, allows the synchronization to be performed for online applications. This provides equivalent synchronization scores with a rapid offset determination as the streams come into the system. The efficiency of our approach has been verified through experiments that demonstrate its viability with values that are as precise as those obtained by ZNCC.
The proposed approach scored 81\% in time reference classification against the equivalent 81\% of the state-of-the-art approach, requiring much less computational power.}, author = {Pereira, Igor and Silveira, Luiz F. and Gonçalves, Luiz}, doi = {10.3390/s17092021}, issn = {1424-8220}, journal = {Sensors}, keywords = {Correntropy,Variable bit-rate,Video synchronization}, month = sep, number = {9}, pages = {2021}, publisher = {MDPI AG}, title = {{Video Synchronization With Bit-Rate Signals and Correntropy Function}}, url = {http://www.mdpi.com/1424-8220/17/9/2021}, volume = {17}, year = {2017} } % NOTE: the next entry was keyed souza2017, duplicating the key of the Arm Research Summit paper; BibTeX rejects repeated keys, so it is now souza2017b. @inproceedings{souza2017b, address = {Brasília}, author = {Souza, W S and Azevedo, D G and de Souza, Samuel}, booktitle = {Anais do XVII Simpósio Brasileiro em Segurança da Informação e de Sistemas Computacionais}, title = {{Do back-end para o front-end: Uma Avaliação de Segurança de Aplicações Móveis da Justiça Eleitoral}}, year = {2017} } @inproceedings{Xavier-De-Souza2017, abstract = {Programmable circuits such as general-purpose processors or FPGAs have their end-user energy efficiency strongly dependent on the program that they execute. Ultimately, it is the programmer's ability to code and, in the case of general purpose processors, the compiler's ability to translate source code into a sequence of native instructions that make the circuit deliver the expected performance to the end user. This way, the benefits of energy-efficient circuits build upon energy-efficient devices could be obfuscated by poorly written software. Clearly, having well-written software running on conventional circuits is no better in terms of energy efficiency than having poorly written software running on energy-efficient circuits.
Therefore, to get the most out of the energy-saving capabilities of programmable circuits that support low voltage operating modes, it is necessary to address software issues that might work against the benefits of operating in such modes.}, author = {Xavier-De-Souza, Samuel and Neves, Eduardo A. and Furtunato, Alex F. A. and Silveira, Luiz F. Q. and Georgiou, Kyriakos and Eder, Kerstin I.}, booktitle = {2017 5th Berkeley Symposium on Energy Efficient Electronic Systems, E3S 2017 - Proceedings}, doi = {10.1109/E3S.2017.8246198}, url = {https://www.doi.org/10.1109/E3S.2017.8246198}, isbn = {9781538632901}, month = jun, pages = {1--3}, publisher = {Institute of Electrical and Electronics Engineers Inc.}, title = {{The benefits of low operating voltage devices to the energy efficiency of parallel systems}}, year = {2017} } @inproceedings{Albuquerque2016, abstract = {This paper presents a new time-effective GPS acquisition algorithm that improves the Time to First Fix (TTFF) of hardware GPS receivers under power consumption or hardware constraints. Based on a modified Serial Search Acquisition Algorithm (SA), this enhanced alternative, called Reduced Two Steps Acquisition (RTSA), provides an average gain of 64.18\% in number of SA calculations. In terms of speed-up RTSA was in average 3x faster than SA without needing additional hardware resources.}, author = {Albuquerque, Glauberto L. A.
and Valderrama, Carlos and Silva, Fabrício Costa and Xavier-De-Souza, Samuel}, booktitle = {Proceedings of 2016 International Conference on Localization and GNSS, ICL-GNSS 2016}, doi = {10.1109/ICL-GNSS.2016.7533687}, url = {https://www.doi.org/10.1109/ICL-GNSS.2016.7533687}, isbn = {9781509017577}, keywords = {Cold Start,GPS,Global Positioning Systems}, month = aug, publisher = {Institute of Electrical and Electronics Engineers Inc.}, title = {{Time-effective GPS time domain signal Acquisition Algorithm}}, year = {2016} } @inproceedings{Araujo2016, abstract = {Serial and parallel implementations of a finite difference simulator for the dynamic behavior of directional sucker-rod pumping wells that takes into account fluid flow inside the rod-tubing annulus are presented and analyzed. The performance and scalability of the implementations are compared. The results show that the parallel versions bring significant speed improvements over the serial versions in the majority of cases, and that the efficiency of the parallel versions scales along with problem size.}, author = {Araújo, Roger R. F. and Xavier-De-Souza, Samuel}, booktitle = {Proceedings of the 6th IASTED International Conference on Modelling, Simulation and Identification, MSI 2016}, doi = {10.2316/P.2016.840-023}, url = {https://www.doi.org/10.2316/P.2016.840-023}, isbn = {9780889869837}, keywords = {Directional wells,Dynamical systems,Finite difference methods,Parallelization,Sucker-rod pumping,Well design}, month = aug, pages = {89--98}, publisher = {Acta Press}, title = {{Parallel optimization of a simulation of dynamic behavior of directional sucker-rod pumping wells}}, year = {2016} } @article{C.Benjamim2016, abstract = {There are control systems in which sensors, actuators and controllers can't communicate by wired networks. In these environments, the use of wireless communications system is an alternative, but this can create other problems in the system, like delay and information loss.
This paper investigates the performance of technique a Model Based Control (MBC) used to improve the response of a nonlinear invariant system, using a analogic circuit to simulate a tank level control, and analyzing the control behavior considering a communication with information loss. The results demonstrated that the technique improves the wireless control system.}, author = {{C. Benjamim}, Xiankleber and {S. Gama}, Felipe O. and Salazar, Andrés O and Silveira, Luiz F Q}, doi = {10.15662/IJAREEIE.2016.0509070}, issn = {23203765}, journal = {International Journal of Advanced Research in Electrical, Electronics and Instrumentation Engineering}, keywords = {Control System,Information Loss,Model Based Control,Wireless Communications}, month = sep, number = {9}, pages = {7512--7517}, title = {{Wireless Control System with Model Based Control}}, url = {http://ijareeie.com/upload/2016/september/53_Wireless.pdf}, volume = {5}, year = {2016} } @inproceedings{Cavalcante2016, abstract = {In this work, we evaluate the performance of Wavelet-Coding into offering robustness for OFDM signals against the combined effects of varying fading and noise bursts. Wavelet-Code enables high diversity gains with a low complex receiver, and, most notably, without compromising the system's spectral efficiency. The results show that the Wavelet-Coded OFDM system achieves a BER of $10^{-3}$ with nearly 6 dB less SNR than the convolutional coded OFDM system in frequency selective channels with a normalized channel response variation rate of $\zeta = 10^{-4}$. The proposed system fits as a key enabler for the use of mm-wave frequencies in future generation mobile communication due to its robustness against multipath fading.}, author = {Cavalcante, Lucas and {Vegas Olmos}, J. J. and Monroy, Idelfonso T. and Dinis, Rui and {De Silveira}, Luiz G. Q.
and {De Silveira}, Luiz F. Q.}, booktitle = {IEEE Vehicular Technology Conference}, doi = {10.1109/VTCFall.2016.7881967}, url = {https://www.doi.org/10.1109/VTCFall.2016.7881967}, isbn = {9781509017010}, issn = {15502252}, month = jul, publisher = {Institute of Electrical and Electronics Engineers Inc.}, title = {{Wavelet-Coded OFDM for next generation mobile communications}}, year = {2016} } @article{Cavalcante2016a, abstract = {Millimeter wave communications based on photonic technologies have gained increased attention to provide optic fiber-like capacity in wireless environments. However, the new hybrid fiber-wireless channel represents new challenges in terms of signal transmission performance analysis. Traditionally, such systems use diversity schemes in combination with digital signal processing techniques to overcome effects such as fading and inter-symbol interference (ISI). Wavelet Channel Coding (WCC) has emerged as a technique to minimize the fading effects of wireless channels, which is a major challenge in systems operating in the millimeter wave regime. This work takes the WCC one step beyond by performance evaluation in terms of bit error probability, over time-varying, frequency-selective multipath Rayleigh fading channels. The adopted propagation model follows the COST207 norm, the main international standard reference for GSM, UMTS, and EDGE applications. The results show how WCC can be efficient against ISI. To the best of our knowledge this is the first time WCC is considered on Radio-over-Fiber transmissions at mm-wave range.}, author = {Cavalcante, Lucas and Silveira, Luiz F. Q. and Rommel, Simon and {Vegas Olmos}, J. J.
and {Tafur Monroy}, I.}, doi = {10.1007/s11082-015-0284-1}, issn = {1572817X}, journal = {Optical and Quantum Electronics}, keywords = {Doppler shift,Frequency selective fading,Millimeter-wave communications,Radio-over-fiber,Wavelet channel coding,Wireless communications}, month = jan, number = {1}, pages = {1--9}, publisher = {Springer New York LLC}, title = {{Performance analysis of wavelet channel coding in COST207-based channel models on simulated radio-over-fiber systems at the W-band}}, url = {https://link.springer.com/article/10.1007/s11082-015-0284-1}, volume = {48}, year = {2016} } @inproceedings{DeQueirozSilveira2016, abstract = {Since its advent, the wavelet filtering technique provides time-diversity gains to M-ary digital communications systems, while it keeps their spectral efficiency unaffected. However, the receiver design is more critical under this novel time-diversity transmission system. To tackle this problem, we propose a MMSE-based receiver. This paper presents the performance evaluation of a novel wavelet-filtered based system over flat Rayleigh fading channel. The results so obtained show the effectiveness of the proposed approach, giving rise to outstanding performance gains over conventional amplitude/phase modulations with the same spectral efficiency.}, author = {{De Queiroz Silveira}, Luiz Gonzaga and {De Queiroz Silveira}, Luiz Felipe}, booktitle = {EUCNC 2016 - European Conference on Networks and Communications}, doi = {10.1109/EuCNC.2016.7560994}, url = {https://www.doi.org/10.1109/EuCNC.2016.7560994}, isbn = {9781509028931}, month = sep, pages = {6--10}, publisher = {Institute of Electrical and Electronics Engineers Inc.}, title = {{MMSE-based receiver for wavelet-filtered systems over flat fading channels}}, year = {2016} } @inproceedings{silva2016c, address = {Natal}, author = {Silva, M. R. and Alsina, P. J. and Medeiros, A. A. D. and Silveira, L. F. Q. and Nogueira, M. and Albuquerque, G. L. A.
and Dantas, J.}, booktitle = {Anais do Fórum de Pesquisa e Inovação do CLBI}, title = {{Especificação de Arquitetura de Rede de Comunicação para Sistema Multi VANT Aplicado à Varredura de Área de Impacto de Foguetes}}, year = {2016} } % NOTE(review): the keys gama2016 and Gama2016 below differ only by letter case; classic BibTeX folds case and reports a repeated entry, so consider renaming one of them. @inproceedings{gama2016, address = {Lima}, author = {Gama, F O S and Fonseca, D A M and Benjamim, X C and Salazar, A O and Silveira, L F Q}, booktitle = {Anais do VII Congresso Internacional de Computación y Telecomunicaciones}, title = {{Perspectiva de Redes de Sensores Sem fio em um Sistema de Controle de Malha Fechada}}, url = {https://www.researchgate.net/publication/308766125_Perspectiva_de_Redes_de_Sensores_Sem_fio_em_um_Sistema_de_Controle_de_Malha_Fechada}, year = {2016} } @inproceedings{Gama2016, abstract = {The advance in wireless sensor networking technology is increasing the number of control systems that use these networks to transmit the relevant variable to be measured and controlled, despite of the more intense distortions caused by wireless channels. The performance of wireless communications systems is mainly limited by fading produced by multipath propagation. In order to minimize the fading effects, channel coding and diversity techniques are often used in wireless systems. Among the known coding techniques in the literature, the wavelet coding presents an interesting alternative to overcome the multipath fading, since it gets performance gain by transmitting in time diversity without compromising spectral efficiency. This paper investigates the use of wavelet coding in a system that operates over a wireless channel to control the rotation frequency of the direct current motor. Aspects such as packet error probability performance, hardware complexity and processing delays due to wavelet coding are analyzed, as well as its beneficial effects on the control system. In the proposed system, the wavelet coding was embedded in PIC microcontroller and a radio transceiver XBee is used to establish a wireless link.
The obtained results demonstrate a reduction of fading effects on the control signal, as well as, a low cost for hardware implementation and a small impact on system processing time.}, author = {Gama, Felipe O. S. and Fernandes, Jefferson D. and Semente, Rodrigo S. and Salazar, Andres O. and Silveira, Luiz F. Q.}, booktitle = {2016 1st Symposium on Instrumentation Systems, Circuits and Transducers, INSCIT 2016 - Proceedings}, doi = {10.1109/INSCIT.2016.7598193}, url = {https://www.doi.org/10.1109/INSCIT.2016.7598193}, isbn = {9781509033027}, keywords = {Wavelet Coding,Wireless Communications}, month = oct, pages = {49--54}, publisher = {Institute of Electrical and Electronics Engineers Inc.}, title = {{Application of wavelet coding in a control system using wireless sensor networks}}, year = {2016} } @inproceedings{Guimaraes2016, abstract = {The System identification explores ways to obtain mathematical models of an unknown system. However, as a result from the intrinsic random nature of system or from the environment noise, it is very hard to find a perfect mathematical representation of a real system. This paper aims to evaluate the Maximum Correntropy Criterion (MCC) performance using the gradient descent and the Fixed-Point. Both methods were compared in different noise scenarios and their behavior with different system models. The importance of the free parameters was also studied on both methods. The results show that the fixed-point has a better performance and are less noise sensitive.}, author = {Guimaraes, Joao P. F. and Fontes, Aluisio I. R. and Rego, Joilson B. A. and Silveira, Luiz F. Q.
and Martins, Allan M.}, booktitle = {Proceedings of the 2016 IEEE Conference on Evolving and Adaptive Intelligent Systems, EAIS 2016}, doi = {10.1109/EAIS.2016.7502500}, url = {https://www.doi.org/10.1109/EAIS.2016.7502500}, isbn = {9781509025831}, month = jun, pages = {110--113}, publisher = {Institute of Electrical and Electronics Engineers Inc.}, title = {{Performance evaluation of the maximum correntropy criterion in identification systems}}, year = {2016} } @inproceedings{silvad2016, address = {Málaga}, author = {Silva, K G and Aloise, Daniel and Xavier-de-Souza, Samuel and Mladenovic, N}, booktitle = {Proceedings of the 4th International Conference on Variable Neighborhood Search}, title = {{Shorten Nelder-Mead for global optimization}}, year = {2016} } @inproceedings{silva2016b, address = {Recife}, author = {Silva, M R and Alsina, P J and Medeiros, A A D and Silveira, L F Q and Nogueira, M and Albuquerque, G L A and Dantas, J}, booktitle = {Anais do Workshop de Teses e Dissertações de Robótica}, title = {{Especificação de Arquitetura de Rede de Comunicação para Sistema Multi VANT Aplicado à Varredura de Área de Impacto de Foguetes}}, year = {2016} } @inproceedings{silva2016, address = {Natal}, author = {Silva, M R and Monteiro, F and Alsina, P J and Medeiros, A A D and Silveira, L F Q and Nogueira, M and Albuquerque, G L A and Dantas, J}, booktitle = {Anais da Escola Potiguar de Computação e suas Aplicações}, title = {{Análise Comparativa de Estratégias de Varredura de Área para um Sistema de Comunicação Multi Vants no Monitoramento da Área de Impacto de Foguetes Sobre o Mar}}, year = {2016} } @inproceedings{Souza2016, author = {Souza, Pedro and Souza, Vinícius and Silveira, Luiz F.}, booktitle = {Anais de XXXIV Simpósio Brasileiro de Telecomunicações}, doi = {10.14209/sbrt.2016.128}, publisher = {Sociedade Brasileira de Telecomunicações}, title = {{Desenvolvimento de um Sistema com Codificação Wavelet em GNU Radio Companion}}, url =
{http://biblioteca.sbrt.org.br/articles/1199}, year = {2016} } @inproceedings{Souza2016a, author = {Souza, Pedro and Souza, Vinícius and Silveira, Luiz}, booktitle = {Anais de XXXIV Simpósio Brasileiro de Telecomunicações}, doi = {10.14209/sbrt.2016.149}, publisher = {Sociedade Brasileira de Telecomunicações}, title = {Arquitetura Inteligente de Sensoriamento Espectral por Análise de Cicloestacionariedades}, url = {http://biblioteca.sbrt.org.br/articles/1447}, year = {2016} } @article{Barros2015, abstract = {With the increase in the number of cores in processor chips observed in recent years, design choices - such as the number of cores in chip, the amount of resources per core, and whether to design homogeneous or heterogeneous chips - need to be given proper support. Several studies on heterogeneous multi-core processors are concerned with performance improvements. In this work, we propose mathematical models to analyze some of these design issues with focus on the reduction of processor dynamic energy. In particular, these models allow the comparison of the dynamic-energy consumption of multi-core architectures when they execute a workload in the same amount of time while allowing different core operating frequency between the compared architectures. The results of the analysis allow chip designers to choose the right conditions for optimal energy savings in heterogeneous multi-core chips based on the parallel fraction of the workloads and on the distributions of the resources among the cores in the chip.
Under a simplified context, the devised models agree with the consolidated knowledge that heterogeneous multi-core chips have considerable advantage over homogeneous multi-core and single-core architectures in terms of energy efficiency.}, author = {Barros, Carlos Avelino and {De Queiroz Silveira}, Luiz Felipe and Valderrama, Carlos Alberto and Xavier-De-Souza, Samuel}, doi = {10.1016/j.micpro.2015.05.009}, url = {https://www.doi.org/10.1016/j.micpro.2015.05.009}, issn = {01419331}, journal = {Microprocessors and Microsystems}, keywords = {CMOS power,Energy savings,Heterogeneous architectures,Multi-core processors,Parallel scalability}, month = jul, number = {6}, pages = {418--425}, publisher = {Elsevier B.V.}, title = {{Optimal processor dynamic-energy reduction for parallel workloads on heterogeneous multi-core architectures}}, volume = {39}, year = {2015} } @article{Fontes2015, abstract = {Automatic modulation classification (AMC) techniques have applications in a variety of wireless communication scenarios, such as adaptive systems, cognitive radio, and surveillance systems. However, a common requirement to most of the AMC techniques proposed in the literature is the use of signal preprocessing modules, which can increase the computational cost and decrease the scalability of the AMC strategy. This work proposes the direct use of a similarity measure based on information theory for the automatic recognition of digital modulations, which is known as correntropy coefficient. The performance of correntropy in AMC applied to channels subject to additive white Gaussian noise (AWGN) is evaluated. Specifically, the influence of the kernel size on the classifier performance is analyzed, since it is the only free parameter in correntropy. Besides, a relationship between its respective value and the signal-to-noise ratio (SNR) of the channel is also proposed.
Considering the investigated modulation techniques, numerical results obtained by simulation demonstrate that there are high accuracy rates in classification, even at low SNR values. By using correntropy, AMC task becomes simpler and more efficient. {\textcopyright} 2014 Elsevier Ltd. All rights reserved.}, author = {Fontes, Aluisio I. R. and {De M. Martins}, Allan and Silveira, Luiz F. Q. and Principe, J. C.}, doi = {10.1016/j.eswa.2014.07.023}, url = {https://www.doi.org/10.1016/j.eswa.2014.07.023}, issn = {09574174}, journal = {Expert Systems with Applications}, keywords = {Automatic modulation classification,Correntropy coefficient,Information theory}, month = jan, number = {1}, pages = {1--8}, publisher = {Elsevier Ltd}, title = {{Performance evaluation of the correntropy coefficient in automatic modulation classification}}, volume = {42}, year = {2015} } @article{gama2015, author = {Gama, F O S and Semente, R S and Silveira, L F Q}, journal = {WSEAS Transactions on Communications}, pages = {89--95}, title = {{Development of a Wavelet Encoder in FPGA}}, url = {https://www.wseas.org/multimedia/journals/communications/2015/a245704-614.pdf}, volume = {14}, year = {2015} } @article{Linhares2015, abstract = {Recent researches have demonstrated that the Fuzzy Wavelet Neural Networks (FWNNs) are an efficient tool to identify nonlinear systems. In these structures, features related to fuzzy logic, wavelet functions, and neural networks are combined in an architecture similar to the Adaptive Neurofuzzy Inference Systems (ANFIS). In practical applications, the experimental data set used in the identification task often contains unknown noise and outliers, which decrease the FWNN model reliability. In order to reduce the negative effects of these erroneous measurements, this work proposes the direct use of a similarity measure based on information theory in the FWNN learning procedure.
The Mean Squared Error (MSE) cost function is replaced by the Maximum Correntropy Criterion (MCC) in the traditional error backpropagation (BP) algorithm. The input-output maps of a real nonlinear system studied in this work are identified from an experimental data set corrupted by different outliers rates and additive white Gaussian noise. The results demonstrate the advantages of the proposed cost function using the MCC as compared to the MSE. This work also investigates the influence of the kernel size on the performance of the MCC in the BP algorithm, since it is the only free parameter of correntropy.}, author = {Linhares, Leandro L S and Fontes, Aluisio I R and Martins, Allan M and Araújo, Fábio M U and Silveira, Luiz F Q}, doi = {10.1155/2015/678965}, editor = {Zhang, Yudong}, issn = {1024-123X}, journal = {Mathematical Problems in Engineering}, pages = {678965}, publisher = {Hindawi Publishing Corporation}, title = {{Fuzzy Wavelet Neural Network Using a Correntropy Criterion for Nonlinear System Identification}}, url = {https://doi.org/10.1155/2015/678965}, volume = {2015}, year = {2015} } @article{Nunes-Do-Rosario2015, abstract = {Seismic imaging has evolved significantly due to the high demand from the oil/gas industry for hardware technological advancements, boosting the development of more sophisticated algorithms. In order to deliver the quality and accuracy required, the execution of these algorithms may lead to time infeasible solutions. Aiming at performance improvement, this work conducted the parallelization of the core of a reverse time migration (RTM) algorithm. Furthermore, analysis such as speedup and efficiency was performed in order to assess the scalability of the proposed method. While the many parallelization efforts so far deal with coarse-grain approaches, this letter tackles the intrashot fine-grain parallelization of prestack RTM, which increases the overall concurrency degree of the algorithm.
Results using 2-D synthetic data show that the proposed approach is scalable, which means that an increase in hardware resources and/or in problem size will lead to a proportional increase in speed and/or accuracy.}, author = {Nunes-Do-Rosário, Desnes A. and Xavier-De-Souza, Samuel and Maciel, Rosangela C. and Costa, Jessé C.}, doi = {10.1109/LGRS.2015.2482481}, url = {https://www.doi.org/10.1109/LGRS.2015.2482481}, issn = {1545598X}, journal = {IEEE Geoscience and Remote Sensing Letters}, keywords = {Algorithm design and analysis,Computational modeling,Imaging,Multicore processing,Parallel processing,Runtime,Scalability}, month = dec, number = {12}, pages = {2433--2437}, publisher = {Institute of Electrical and Electronics Engineers Inc.}, title = {{Parallel Scalability of a Fine-Grain Prestack Reverse Time Migration Algorithm}}, volume = {12}, year = {2015} } @inproceedings{rego2015, address = {Natal}, author = {Rego, J B A and Fontes, A I R and {Dória Neto}, A D and Silveira, L F Q and {De M. Martins}, Allan}, booktitle = {Anais do Simpósio Brasileiro de Automação Inteligente}, title = {{Linear Regression Based on Correntropy for Sensor Calibration}}, url = {http://www.lii.dca.ufrn.br/download/artigo/332}, year = {2015} } @inproceedings{Silva2015, address = {Honolulu}, author = {Silva, Fabrício Costa and Xavier-de-Souza, Samuel and Silveira, Luiz F. Q. and Mota, Francisco das Chagas and de Albuquerque, Glauberto Leilson Alves and Valderrama, Carlos Alberto}, booktitle = {Proceedings of the ION 2015 Pacific PNT Meeting}, issn = {2331-6284}, month = apr, pages = {629--634}, title = {{Two-step Low Complexity GPS Signal Acquisition}}, url = {http://www.ion.org/publications/abstract.cfm?jp=p&articleID=12751}, year = {2015} } @inproceedings{Silveira2015, abstract = {As originally designed, the wavelet coding technique efficiently overcomes the fading effects, but limits the spectral efficiency of these systems to 1 bit/s/Hz.
Furthermore, the coded symbols are modulated by unusual signal constellations that need to be designed by optimization methods. An alternative approach based on wavelet matrix to increases the communication system robustness to time-varying fading is proposed in another work by the same authors. This can be easily adapted to any wireless communication system maintaining its original spectral efficiency. However the derivation of receiving strategies is more critical under this novel wavelet-matrix based systems. This paper presents a receiving strategies which is show to be simple and effective, giving rise to outstanding performance gains over conventional amplitude/phase modulations with the same spectral efficiency.}, author = {Silveira, Luiz F.Q. and Silveira, Luiz G.De Q. and {De Assis}, Francisco M. and Pinto, Ernesto Leite}, booktitle = {SBMO/IEEE MTT-S International Microwave and Optoelectronics Conference Proceedings}, doi = {10.1109/IMOC.2015.7369171}, url = {https://www.doi.org/10.1109/IMOC.2015.7369171}, isbn = {9781467394925}, month = {dec}, publisher = {Institute of Electrical and Electronics Engineers Inc.}, title = {{Low-complexity receiver for wavelet-filtered M-ary modulations over flat-fading channels}}, volume = {2015-Decem}, year = {2015} } @inproceedings{Xavier-De-Souza2015, abstract = {Before the current computational era, when the most common processors had a single processing core, the speed of computation was mainly defined by the speed of that core. Faster cores usually reflected in faster algorithms and applications. In the current era, the speed of computation is no longer primarily boosted by faster cores. Due to the thermal effect known as the power wall, the increment in speed that can be reached from one processor generation to another is very limited. The power wall is not the only limiting factor though. The degree of instruction level parallelism has also reached far in the law of diminishing returns. 
Today's era is governed by multi-core processors. The power wall was circumvented with task level parallelism. The downside is that many applications may not effortlessly become faster with new generations of processors. In the multi-core era, faster algorithms are obtained with a combination of more processing cores and a good exploration of task level parallelism, meaning that algorithm designers have now an active roll in sustaining the performance of their application through generations of processors.}, author = {Xavier-De-Souza, Samuel and Barros, Carlos A. and Jales, Marcio O. and Silveira, Luiz F.Q.}, booktitle = {2015 4th Berkeley Symposium on Energy Efficient Electronic Systems, E3S 2015 - Proceedings}, doi = {10.1109/E3S.2015.7336814}, url = {https://www.doi.org/10.1109/E3S.2015.7336814}, isbn = {9781467385688}, keywords = {Energy measurement,Multicore processing,Power measurement,Program processors,Time measurement,Time-frequency analysis}, month = {nov}, publisher = {Institute of Electrical and Electronics Engineers Inc.}, title = {{Not faster nor slower tasks, but less energy hungry and parallel: Simulation results}}, year = {2015} } @article{DeSouza2014, abstract = {Introduction: Patient monitoring will tend to decline in the coming years due to a shortage of physical and human resources in hospitals. Therefore, several studies define alternatives to improve patient monitoring using wireless networks. In these studies, a wireless network is used to transfer data generated by medical sensors without interacting with the traffic in the data network of the hospital. However, this approach should be avoided because there are demands for integration between user applications and patient monitoring. Therefore, this paper defines a patient monitoring system, called Wi-Bio, directed to the establishment of IEEE 802.11 networks that allows traffic generated by user applications. 
Methods: The formal validation of Wi-Bio was made through the design of Petri nets, and performance analysis was performed through simulations of the Network Simulator 2 tool. The adoption of this approach is justified by the fact that Petri nets allow verification of logical correctness of the designed systems, while simulations allow behavioral analysis of Wi-Bio in overload scenarios where many patients are monitored. Results: The results confirmed the validity of the designed Petri nets and showed that Wi-Bio is able to accomplish the temporal goals imposed by medical sensors, thereby promoting efficient integration of traffic present in the data network and the patient monitoring network. Conclusion: As described, Wi-Bio fulfilled its objectives and motivates future studies aimed at complementing the obtained results.}, author = {de Souza, Vinícius Samuel Valério and Valentim, Ricardo Alexsandro de Medeiros and Brandão, Gláucio Bezerra and Silveira, Luiz Felipe de Queiroz and Dantas, Marcel da Câmara Ribeiro and de Souza, Pedro Thiago Valério}, doi = {10.1590/rbeb.2014.010}, issn = {19847742}, journal = {Revista Brasileira de Engenharia Biomedica}, keywords = {IEEE 802.11,Patient monitoring,Petri nets and Network Simulator 2,Wi-Bio}, number = {2}, pages = {144--158}, publisher = {Sociedade Brasileira de Engenharia Biomedica}, title = {{Wi-Bio: Management policy aimed at the establishment of networks for patient monitoring using IEEE 802.11}}, url = {http://dx.doi.org/10.1590/rbeb.2014.010}, volume = {30}, year = {2014} } @article{Fontes2014, abstract = {This paper proposes the use of a similarity measure based on information theory called correntropy for the automatic classification of pathological voices. By using correntropy, it is possible to obtain descriptors that aggregate distinct spectral characteristics for healthy and pathological voices.
Experiments using computational simulation demonstrate that such descriptors are very efficient in the characterization of vocal dysfunctions, leading to a success rate of 97{\%} in the classification. With this new architecture, the classification process of vocal pathologies becomes much more simple and efficient.}, author = {Fontes, Aluisio I R and Souza, Pedro T V and Neto, Adrião D D and Martins, Allan de M and Silveira, Luiz F Q}, doi = {10.1155/2014/924786}, editor = {Wong, Pak-Kin}, issn = {1024-123X}, journal = {Mathematical Problems in Engineering}, pages = {924786}, publisher = {Hindawi Publishing Corporation}, title = {{Classification System of Pathological Voices Using Correntropy}}, url = {https://doi.org/10.1155/2014/924786}, volume = {2014}, year = {2014} } @article{LIMA2014, abstract = {The evolution of wireless communication systems leads to Dynamic Spectrum Allocation for Cognitive Radio, which requires reliable spectrum sensing techniques. Among the spectrum sensing methods proposed in the literature, those that exploit cyclostationary characteristics of radio signals are particularly suitable for communication environments with low signal-to-noise ratios, or with non-stationary noise. However, such methods have high computational complexity that directly raises the power consumption of devices which often have very stringent low-power requirements. We propose a strategy for cyclostationary spectrum sensing with reduced energy consumption. This strategy is based on the principle that p processors working at slower frequencies consume less power than a single processor for the same execution time. We devise a strict relation between the energy savings and common parallel system metrics. The results of simulations show that our strategy promises very significant savings in actual devices. Copyright {\textcopyright} 2014 The Institute of Electronics, Information and Communication Engineers.}, author = {LIMA, Arthur D.D. and BARROS, Carlos A.
and SILVEIRA, Luiz Felipe Q. and XAVIER-DE-SOUZA, Samuel and VALDERRAMA, Carlos A.}, doi = {10.1587/transcom.E97.B.326}, issn = {0916-8516}, journal = {IEICE Transactions on Communications}, keywords = {Cognitive radio,Cyclostationarity,Low power,Parallel scalability,Spectrum sensing}, month = {feb}, number = {2}, pages = {326--333}, publisher = {Institute of Electronics, Information and Communication Engineers, IEICE}, title = {{Parallel Cyclostationarity-Exploiting Algorithm for Energy-Efficient Spectrum Sensing}}, url = {http://jlc.jst.go.jp/DN/JST.JSTAGE/transcom/E97.B.326?lang=en&from=CrossRef&type=abstract}, volume = {E97.B}, year = {2014} } @article{RegoFontes2014, abstract = {Background: Similarity measures have application in many scenarios of digital image processing. The correntropy is a robust and relatively new similarity measure that recently has been employed in various engineering applications. Despite other competitive characteristics, its computational cost is relatively high and may impose hard-to-cope time restrictions for high-dimensional applications, including image analysis and computer vision. Methods: We propose a parallelization strategy for calculating the correntropy on multi-core architectures that may turn the use of this metric viable in such applications. We provide an analysis of its parallel efficiency and scalability. Results: The simulation results were obtained on a shared memory system with 24 processing cores for input images of different dimensions. We performed simulations of various scenarios with images of different sizes. The aim was to analyze the parallel and serial fraction of the computation of the correntropy coefficient and the influence of these fractions in its speedup and efficiency. Conclusions: The results indicate that correntropy has a large potential as a metric for image analysis in the multi-core era due to its high parallel efficiency and scalability.}, author = {{Rêgo Fontes}, Aluisio I.
and Xavier-de-Souza, Samuel and {Dória Neto}, Adrião D. and {de Queiroz Silveira}, Luiz Felipe}, doi = {10.1186/s13173-014-0018-4}, issn = {16784804}, journal = {Journal of the Brazilian Computer Society}, keywords = {Correntropy,Multi-core architecture,Parallel efficiency,Parallel scalability,Similarity measures}, month = {dec}, number = {1}, pages = {18}, publisher = {Springer London}, title = {{On the parallel efficiency and scalability of the correntropy coefficient for image analysis}}, url = {https://journal-bcs.springeropen.com/articles/10.1186/s13173-014-0018-4}, volume = {20}, year = {2014} } @inproceedings{Souza-de-Assis2014b, address = {Rio de Janeiro}, author = {Souza-de-Assis, Italo A. and Nunes-do-Rosário, D. A. and Maciel, R. C. and Xavier-de-Souza, S.}, booktitle = {Rio Oil \& Gas Expo and Conference}, keywords = {Souza-de-Assis2014b}, title = {{Um Algoritmo Paralelo Eficiente de Propagação de Onda Acústica 3D}}, year = {2014}, url = {https://www.researchgate.net/publication/317239391_UM_ALGORITMO_PARALELO_EFICIENTE_DE_PROPAGACAO_DE_ONDA_ACUSTICA_3D} }
.
.
p.
.
[bibtex]