{"id":"https://openalex.org/W4223941905","doi":"https://doi.org/10.1145/3505170.3506730","title":"Kernel Mapping Techniques for Deep Learning Neural Network Accelerators","display_name":"Kernel Mapping Techniques for Deep Learning Neural Network Accelerators","publication_year":2022,"publication_date":"2022-04-13","ids":{"openalex":"https://openalex.org/W4223941905","doi":"https://doi.org/10.1145/3505170.3506730"},"language":"en","primary_location":{"id":"doi:10.1145/3505170.3506730","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3505170.3506730","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 International Symposium on Physical Design","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056919850","display_name":"Sarp \u00d6zdemir","orcid":"https://orcid.org/0000-0002-4212-7646"},"institutions":[{"id":"https://openalex.org/I123946342","display_name":"Binghamton University","ror":"https://ror.org/008rmbt77","country_code":"US","type":"education","lineage":["https://openalex.org/I123946342"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Sarp \u00d6zdemir","raw_affiliation_strings":["SUNY Binghamton, Binghamton, NY, USA"],"affiliations":[{"raw_affiliation_string":"SUNY Binghamton, Binghamton, NY, USA","institution_ids":["https://openalex.org/I123946342"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023818218","display_name":"Mohammad T. Khasawneh","orcid":"https://orcid.org/0000-0002-4302-6943"},"institutions":[{"id":"https://openalex.org/I123946342","display_name":"Binghamton University","ror":"https://ror.org/008rmbt77","country_code":"US","type":"education","lineage":["https://openalex.org/I123946342"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mohammad Khasawneh","raw_affiliation_strings":["SUNY Binghamton, Binghamton, NY, USA"],"affiliations":[{"raw_affiliation_string":"SUNY Binghamton, Binghamton, NY, USA","institution_ids":["https://openalex.org/I123946342"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113986758","display_name":"Smriti S. Rao","orcid":null},"institutions":[{"id":"https://openalex.org/I123946342","display_name":"Binghamton University","ror":"https://ror.org/008rmbt77","country_code":"US","type":"education","lineage":["https://openalex.org/I123946342"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Smriti Rao","raw_affiliation_strings":["SUNY Binghamton, Binghamton, NY, USA"],"affiliations":[{"raw_affiliation_string":"SUNY Binghamton, Binghamton, NY, USA","institution_ids":["https://openalex.org/I123946342"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5074401951","display_name":"Patrick H. Madden","orcid":"https://orcid.org/0000-0002-1727-6885"},"institutions":[{"id":"https://openalex.org/I123946342","display_name":"Binghamton University","ror":"https://ror.org/008rmbt77","country_code":"US","type":"education","lineage":["https://openalex.org/I123946342"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Patrick H. Madden","raw_affiliation_strings":["SUNY Binghamton, Binghamton, NY, USA"],"affiliations":[{"raw_affiliation_string":"SUNY Binghamton, Binghamton, NY, USA","institution_ids":["https://openalex.org/I123946342"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5056919850"],"corresponding_institution_ids":["https://openalex.org/I123946342"],"apc_list":null,"apc_paid":null,"fwci":0.6991,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.65255157,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"21","last_page":"28"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8257633447647095},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.6804580092430115},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.6324790120124817},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.6173461675643921},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6053698658943176},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.52999347448349},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.4841121435165405},{"id":"https://openalex.org/keywords/contest","display_name":"CONTEST","score":0.4785195589065552},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.41391366720199585},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.40983033180236816},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.3983845114707947},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3922906816005707}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8257633447647095},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.6804580092430115},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.6324790120124817},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.6173461675643921},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6053698658943176},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.52999347448349},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.4841121435165405},{"id":"https://openalex.org/C2777582232","wikidata":"https://www.wikidata.org/wiki/Q5013414","display_name":"CONTEST","level":2,"score":0.4785195589065552},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.41391366720199585},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.40983033180236816},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3983845114707947},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3922906816005707},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3505170.3506730","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3505170.3506730","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 International Symposium on Physical Design","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W1686810756","https://openalex.org/W1970296212","https://openalex.org/W2025516544","https://openalex.org/W2050095818","https://openalex.org/W2115866417","https://openalex.org/W2119248453","https://openalex.org/W2128703518","https://openalex.org/W2963358710","https://openalex.org/W3004127905","https://openalex.org/W3012493694","https://openalex.org/W3112683606","https://openalex.org/W3136872908","https://openalex.org/W3203992401","https://openalex.org/W6680735601"],"related_works":["https://openalex.org/W2946214509","https://openalex.org/W2606108738","https://openalex.org/W4286740636","https://openalex.org/W2628063975","https://openalex.org/W2356479129","https://openalex.org/W2387346515","https://openalex.org/W2352196451","https://openalex.org/W2590086693","https://openalex.org/W2381260192","https://openalex.org/W3122423648"],"abstract_inverted_index":{"Deep":[0],"learning":[1,32],"applications":[2],"are":[3,110],"compute":[4,49],"intensive":[5],"and":[6,35,64],"naturally":[7],"parallel;":[8],"this":[9,24,42],"has":[10],"spurred":[11],"the":[12,20,80,88],"development":[13],"of":[14,84,90,93],"new":[15],"processor":[16],"architectures":[17],"tuned":[18],"for":[19,45],"work":[21],"load.":[22],"In":[23],"paper,":[25],"we":[26],"consider":[27],"structural":[28],"differences":[29],"between":[30],"deep":[31],"neural":[33,47],"networks":[34],"more":[36],"conventional":[37],"circuits":[38],"--":[39],"highlighting":[40],"how":[41],"impacts":[43],"strategies":[44],"mapping":[46,58],"network":[48],"kernels":[50],"onto":[51],"available":[52],"hardware.":[53],"We":[54,72],"present":[55],"an":[56,75],"efficient":[57],"approach":[59,77],"based":[60],"on":[61],"dynamic":[62],"programming,":[63],"also":[65,73,111],"a":[66,91,97,106],"method":[67],"to":[68,78],"establish":[69],"performance":[70,99],"bounds.":[71],"propose":[74],"architectural":[76],"extend":[79],"practical":[81],"life":[82],"time":[83],"hardware":[85],"accelerators,":[86],"enabling":[87],"integration":[89],"variety":[92],"heterogenous":[94],"processors":[95],"into":[96],"high":[98],"system.":[100],"Experimental":[101],"results":[102],"using":[103],"benchmarks":[104],"from":[105],"recent":[107],"ISPD":[108],"contest":[109],"reported.":[112]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-06T13:50:29.536080","created_date":"2025-10-10T00:00:00"}
