<?xml version="1.0" encoding="UTF-8"?><rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:dcq="http://purl.org/dc/terms/"><records count="1" morepages="false" start="1" end="1"><record rownumber="1"><dc:product_type>Journal Article</dc:product_type><dc:title>D-STACK: High Throughput DNN Inference by Effective Multiplexing and Spatio-Temporal Scheduling of GPUs</dc:title><dc:creator>Dhakal, Aditya; Kulkarni, Sameer G; Ramakrishnan, K K</dc:creator><dc:corporate_author/><dc:editor/><dc:description/><dc:publisher>IEEE</dc:publisher><dc:date>2024-10-01</dc:date><dc:nsf_par_id>10580065</dc:nsf_par_id><dc:journal_name>IEEE Transactions on Cloud Computing</dc:journal_name><dc:journal_volume>12</dc:journal_volume><dc:journal_issue>4</dc:journal_issue><dc:page_range_or_elocation>1344 to 1358</dc:page_range_or_elocation><dc:issn>2372-0018</dc:issn><dc:isbn/><dc:doi>https://doi.org/10.1109/TCC.2024.3476210</dc:doi><dcq:identifierAwardId>1823270</dcq:identifierAwardId><dc:subject/><dc:version_number/><dc:location/><dc:rights/><dc:institution/><dc:sponsoring_org>National Science Foundation</dc:sponsoring_org></record></records></rdf:RDF>