% Symposium paper by Hirano and Nakayama: RLS-based adaptive filters on an
% nVIDIA GeForce GPU using CUDA. Stored as an inproceedings entry because the
% venue is a symposium proceedings volume, not a journal.
% The abstract lives in the abstract field (not note) so that standard styles
% do not print it in the reference list.
% NOTE(review): the proceedings title reads 26th in Japanese but 25th in
% English; kept exactly as exported -- confirm against the printed proceedings.
% NOTE(review): the booktitle contains non-ASCII text; presumably this file is
% processed by a UTF-8 capable toolchain -- verify before using classic BibTeX.
@inproceedings{oai:kanazawa-u.repo.nii.ac.jp:00008995,
  author    = {Hirano, Akihiro and Nakayama, Kenji},
  title     = {Implementation of {RLS}-based Adaptive Filters on {nVIDIA} {GeForce} Graphics Processing Unit},
  booktitle = {第26回信号処理シンポジウム講演論文集 = Proc. of 25th SIP Symposium},
  pages     = {477--481},
  month     = jan,
  year      = {2011},
  abstract  = {This paper presents efficient implementation of RLS-based adaptive filters with a large number of taps on nVIDIA GeForce graphics processing unit (GPU) and CUDA software development environment. Modification of the order and the combination of calculations reduces the number of accesses to slow off-chip memory. Assigning tasks into multiple threads also takes memory access order into account. For a 4096-tap case, a GPU program is almost three times faster than a CPU program.},
}