@comment{Entry 1479: journal article on an FPGA implementation of the Fast Inverse Square Root algorithm. Authors are stored in "Last, First" form joined by " and "; no DOI is recorded for this entry, so the url field is the only locator.}
@article{1479,
  author   = {Zafar, Saad and Zulfiqar, Numair},
  title    = {Hardware Architecture Design and Mapping of {`Fast Inverse Square Root'} Algorithm},
  journal  = {Electronic Devices},
  year     = {2014},
  volume   = {3},
  number   = {1},
  url      = {http://www.dline.info/ed/fulltext/v3n1/4.pdf},
  abstract = {The Fast Inverse Square Root algorithm has been used in 3D games of past for lighting and reflection calculations, because it offers up to four times performance gains. This paper presents a hardware implementation of the same algorithm on an FPGA board by designing the complete architecture and successfully mapping it on Xilinx Spartan 3E after thorough functional verification. The results show that this implementation provides a very efficient single-precision floating point inverse square root calculator with a practically accurate result being made available after just 12 short clock cycles. This performance measure is far superior to the software counterpart of the algorithm, and is not processor dependent like rsqrtss of x86 SSE instruction set. Results of this work can aid FPGA based vector processors or graphic processing units with 3D rendering. The hardware design can also form part of a larger floating point arithmetic unit for dedicated reciprocal square root calculations.},
}