% Conference paper: Zhou, Powers and Roveda, SOCC 2014.
% Names are stored in "Last, First" form with no literal braces, and the
% compound term in the title is brace-protected so sentence-casing styles keep
% its capitals. `series` is omitted because it repeated `booktitle` verbatim.
@inproceedings{63c02b07f0c94ab192a97862c1d992d4,
  author    = {Zhou, He and Powers, Linda S. and Roveda, Janet M.},
  title     = {Collision array based workload assignment for {Network-on-Chip} concurrency},
  booktitle = {International System on Chip Conference},
  editor    = {Shi, Kaijian and Buchner, Thomas and Zhao, Danella and Sridhar, Ramalingam},
  publisher = {IEEE Computer Society},
  pages     = {188--191},
  year      = {2014},
  month     = nov,
  day       = {5},
  doi       = {10.1109/SOCC.2014.6948924},
  language  = {English (US)},
  keywords  = {Network-on-Chip system, collision array, parallelism, workload assignment},
  abstract  = {To improve Network-on-Chip (NoC) parallelism, this paper proposes a new collision array based workload assignment to increase data request cancellation. Through a task flow partitioning algorithm, we minimize sequential data access and then dynamically schedule tasks while minimizing router execution time. Experimental results show that this method can provide an average of 87.7\% system throughput improvement and 41.4\% router execution time reduction. This throughput improvement is the direct consequence of collision array. A 7x improvement was reported in [10] Fig. 7 when 32 threads are employed on a single core. The system can achieve 2.7 times of speedup. By investigating the performance-overhead tradeoff between different collision array sizes, we proved a maximum of 42.9\% energy and area overheads saving, only with a cost of 23.6\% performance degradation in term of router execution time.},
  note      = {Publisher Copyright: {\textcopyright} 2014 IEEE.; 27th IEEE International System on Chip Conference, SOCC 2014 ; Conference date: 02-09-2014 Through 05-09-2014},
}