{"id":"https://openalex.org/W4211050422","doi":"https://doi.org/10.1145/3463911","title":"DirectNVM: Hardware-accelerated NVMe SSDs for High-performance Embedded Computing","display_name":"DirectNVM: Hardware-accelerated NVMe SSDs for High-performance Embedded Computing","publication_year":2022,"publication_date":"2022-01-31","ids":{"openalex":"https://openalex.org/W4211050422","doi":"https://doi.org/10.1145/3463911"},"language":"en","primary_location":{"id":"doi:10.1145/3463911","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3463911","pdf_url":null,"source":{"id":"https://openalex.org/S136160450","display_name":"ACM Transactions on Embedded Computing Systems","issn_l":"1539-9087","issn":["1539-9087","1558-3465"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Embedded Computing Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5090610227","display_name":"Yu Zou","orcid":"https://orcid.org/0000-0002-4541-6638"},"institutions":[{"id":"https://openalex.org/I106165777","display_name":"University of Central Florida","ror":"https://ror.org/036nfer12","country_code":"US","type":"education","lineage":["https://openalex.org/I106165777"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yu Zou","raw_affiliation_strings":["University of Central Florida, Orlando, FL, US"],"affiliations":[{"raw_affiliation_string":"University of Central Florida, Orlando, FL, US","institution_ids":["https://openalex.org/I106165777"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017485096","display_name":"Amro Awad","orcid":"https://orcid.org/0000-0003-3987-463X"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Amro Awad","raw_affiliation_strings":["North Carolina State University, Raleigh, NC, US"],"affiliations":[{"raw_affiliation_string":"North Carolina State University, Raleigh, NC, US","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060908808","display_name":"Mingjie Lin","orcid":"https://orcid.org/0000-0002-3225-4406"},"institutions":[{"id":"https://openalex.org/I106165777","display_name":"University of Central Florida","ror":"https://ror.org/036nfer12","country_code":"US","type":"education","lineage":["https://openalex.org/I106165777"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mingjie Lin","raw_affiliation_strings":["University of Central Florida, Orlando, FL, US"],"affiliations":[{"raw_affiliation_string":"University of Central Florida, Orlando, FL, US","institution_ids":["https://openalex.org/I106165777"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5090610227"],"corresponding_institution_ids":["https://openalex.org/I106165777"],"apc_list":null,"apc_paid":null,"fwci":0.8288,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.7269396,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"21","issue":"1","first_page":"1","last_page":"24"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9936000108718872,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.987500011920929,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8303791880607605},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.5957459211349487},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.533386766910553},{"id":"https://openalex.org/keywords/massively-parallel","display_name":"Massively parallel","score":0.43035706877708435},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.4168754816055298}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8303791880607605},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.5957459211349487},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.533386766910553},{"id":"https://openalex.org/C190475519","wikidata":"https://www.wikidata.org/wiki/Q544384","display_name":"Massively parallel","level":2,"score":0.43035706877708435},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.4168754816055298}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3463911","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3463911","pdf_url":null,"source":{"id":"https://openalex.org/S136160450","display_name":"ACM Transactions on Embedded Computing Systems","issn_l":"1539-9087","issn":["1539-9087","1558-3465"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Embedded Computing Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.4099999964237213,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W1986470696","https://openalex.org/W1995277983","https://openalex.org/W2032801361","https://openalex.org/W2128757673","https://openalex.org/W2751343396","https://openalex.org/W2776946878","https://openalex.org/W2835033020","https://openalex.org/W2910146857","https://openalex.org/W2995244831","https://openalex.org/W3015040392","https://openalex.org/W4299654723"],"related_works":["https://openalex.org/W2461970972","https://openalex.org/W2364921833","https://openalex.org/W2388030554","https://openalex.org/W2302028273","https://openalex.org/W2117141678","https://openalex.org/W1525643724","https://openalex.org/W1572543472","https://openalex.org/W1595151633","https://openalex.org/W2053911416","https://openalex.org/W2357291590"],"abstract_inverted_index":{"With":[0],"data-intensive":[1],"artificial":[2],"intelligence":[3],"(AI)":[4],"and":[5,23,42,72,79,91,135,174,199,218,249,252,256,294,312,320,360,430,460,492],"machine":[6],"learning":[7],"(ML)":[8],"applications":[9,203,459,463],"rapidly":[10],"surging,":[11],"modern":[12,65,83,117],"high-performance":[13,118,148,198,285],"embedded":[14,119,149,416],"systems,":[15],"with":[16,37,290,437,477],"heterogeneous":[17],"computing":[18,150,177],"resources,":[19],"critically":[20],"demand":[21],"low-latency":[22],"high-bandwidth":[24],"data":[25,143,221],"communication.":[26],"As":[27],"such,":[28],"the":[29,62,96,102,147,158,166,183,208,224,231,263,277,309,327,338,368,381,453,485],"newly":[30],"emerging":[31],"NVMe":[32,66,103,113,133,142,167,210,392],"(Non-Volatile":[33],"Memory":[34],"Express)":[35],"protocol,":[36,104],"parallel":[38,89,160],"queuing,":[39],"access":[40,144,222],"prioritization,":[41],"optimized":[43,389],"I/O":[44,56,161,232,247,259,313,393,490,494],"arbitration,":[45],"starts":[46],"to":[47,69,109,115,127,140,156,179,182,262,353,356,362,426],"be":[48,70],"widely":[49],"adopted":[50],"as":[51],"a":[52,111,272,284,295,321,346,387,397,412,420,438,471,488],"de":[53],"facto":[54],"fast":[55],"communication":[57,233],"interface.":[58],"However,":[59],"effectively":[60],"leveraging":[61,171],"potential":[63],"of":[64,87,101,132,236,315,370,474],"storage":[67,134,168,202,310],"proves":[68],"nontrivial":[71],"demands":[73],"fine-grained":[74],"control,":[75],"high":[76],"processing":[77,90],"concurrency,":[78],"application-specific":[80,92,257],"optimization.":[81],"Fortunately,":[82],"FPGA":[84],"devices,":[85],"capable":[86],"efficient":[88],"programmability,":[93],"readily":[94],"meet":[95],"underlying":[97],"physical":[98],"layer":[99],"requirements":[100],"therefore":[105,213],"providing":[106,192],"unprecedented":[107],"opportunities":[108],"implementing":[110],"rich-featured":[112],"middleware":[114],"benefit":[116],"computing.":[120],"In":[121],"this":[122],"article,":[123],"we":[124,270,374,442,468],"present":[125],"how":[126],"rethink":[128],"existing":[129],"accessing":[130],"mechanisms":[131],"devise":[136],"innovative":[137],"hardware-assisted":[138],"solutions":[139],"accelerating":[141],"performance":[145,372,475,491],"for":[146,196,230],"system.":[151,400],"Our":[152,401],"key":[153],"idea":[154],"is":[155],"exploit":[157],"massively":[159],"queuing":[162,479],"capability,":[163],"provided":[164],"by":[165,435],"system,":[169],"through":[170,204],"FPGAs\u2019":[172],"reconfigurability":[173],"native":[175],"hardware":[176,194,229],"power":[178],"operate":[180],"transparently":[181],"main":[184],"processor.":[185],"Specifically,":[186,335],"our":[187,267,317,349,371,377,407,446],"DirectNVM":[188,274,318,350,378],"system":[189,275,292,319,324,379],"aims":[190],"at":[191],"effective":[193],"constructs":[195],"facilitating":[197],"scalable":[200],"userspace":[201,390],"(1)":[205],"hardening":[206],"all":[207],"essential":[209],"driver":[211,342],"functionalities,":[212],"avoiding":[214],"expensive":[215],"OS":[216],"syscalls":[217],"enabling":[219],"zero-copy":[220],"from":[223],"application,":[225],"(2)":[226],"relying":[227,237],"on":[228,238,345,396,411],"control":[234],"instead":[235],"OS-level":[239],"interrupts":[240],"that":[241,282,406,445,481],"can":[242,450,482],"significantly":[243,451],"reduce":[244],"both":[245,316],"total":[246],"latency":[248,314],"its":[250,302,493],"variance,":[251],"(3)":[253],"exposing":[254],"cutting-edge":[255],"weighted-round-robin":[258,448],"traffic":[260],"scheduling":[261,449],"userspace.":[264],"To":[265,366],"validate":[266],"design":[268],"methodology,":[269],"developed":[271,470],"complete":[273],"utilizing":[276],"Xilinx":[278],"Zynq":[279,347],"MPSoC":[280],"architecture":[281],"incorporates":[283],"application":[286],"processor":[287,418],"(APU)":[288],"equipped":[289],"DDR4":[291],"memory":[293],"hardened":[296],"configurable":[297],"PCIe":[298],"Gen3":[299],"block":[300],"in":[301,464],"programmable":[303],"logic":[304],"part.":[305],"We":[306],"then":[307],"measured":[308,376],"bandwidth":[311,454],"conventional":[322],"OS-based":[323],"when":[325],"executing":[326],"standard":[328],"FIO":[329],"benchmark":[330],"suite":[331],"[":[332,384],"2":[333],"].":[334],"compared":[336],"against":[337,380],"PetaLinux":[339],"built-in":[340],"kernel":[341],"code":[343],"running":[344,395,410],"MPSoC,":[348],"has":[351],"shown":[352,405],"achieve":[354],"up":[355,361,425],"18.4\u00d7":[357],"higher":[358,428],"throughput":[359,429],"4.5\u00d7":[363],"lower":[364,432],"latency.":[365,433],"ensure":[367],"fairness":[369],"comparison,":[373],"also":[375],"Intel":[382],"SPDK":[383],"26":[385],"],":[386],"highly":[388],"asynchronous":[391],"framework":[394,473],"X86":[398],"PC":[399],"experiment":[402],"results":[403],"have":[404,443,469],"DirectNVM,":[408],"even":[409],"considerably":[413],"less":[414],"powerful":[415],"ARM":[417],"than":[419],"full-scale":[421],"AMD":[422],"processor,":[423],"achieved":[424],"2.2\u00d7":[427],"1.3\u00d7":[431],"Furthermore,":[434],"experimenting":[436],"multi-threading":[439],"test":[440],"case,":[441],"demonstrated":[444],"DirectNVM\u2019s":[447],"optimize":[452],"allocation":[455],"between":[456,487],"latency-constraint":[457],"frontend":[458],"other":[461],"backend":[462],"real-time":[465],"systems.":[466],"Finally,":[467],"theoretical":[472],"modeling":[476],"classic":[478],"theory":[480],"quantitatively":[483],"define":[484],"relationship":[486],"system\u2019s":[489],"implementation.":[495]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":2},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
