{"id":"https://openalex.org/W2406078291","doi":"https://doi.org/10.21437/interspeech.2012-599","title":"KNNDIST: a non-parametric distance measure for speaker segmentation","display_name":"KNNDIST: a non-parametric distance measure for speaker segmentation","publication_year":2012,"publication_date":"2012-09-09","ids":{"openalex":"https://openalex.org/W2406078291","doi":"https://doi.org/10.21437/interspeech.2012-599","mag":"2406078291"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2012-599","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2012-599","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2012","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014830287","display_name":"Seyed Hamidreza Mohammadi","orcid":"https://orcid.org/0000-0002-6892-9241"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Seyed Hamidreza Mohammadi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024773257","display_name":"Hossein Sameti","orcid":"https://orcid.org/0000-0002-8087-8889"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hossein Sameti","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070345621","display_name":"Mahsa Sadat Elyasi Langarani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mahsa Sadat Elyasi Langarani","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5065400728","display_name":"Amirhossein Tavanaei","orcid":"https://orcid.org/0000-0002-6482-440X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Amirhossein Tavanaei","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5014830287"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.2477,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.6150736,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"2282","last_page":"2285"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6851659417152405},{"id":"https://openalex.org/keywords/distance-measures","display_name":"Distance measures","score":0.6689081192016602},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.6602094173431396},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5830737352371216},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5460262298583984},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5454273223876953},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5400558114051819},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.4563068449497223},{"id":"https://openalex.org/keywords/minimum-distance","display_name":"Minimum distance","score":0.42086061835289},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3286032974720001},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.17622491717338562},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.0798804759979248}],"concepts":[{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6851659417152405},{"id":"https://openalex.org/C2639959","wikidata":"https://www.wikidata.org/wiki/Q1344778","display_name":"Distance measures","level":2,"score":0.6689081192016602},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.6602094173431396},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5830737352371216},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5460262298583984},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5454273223876953},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5400558114051819},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.4563068449497223},{"id":"https://openalex.org/C3018063660","wikidata":"https://www.wikidata.org/wiki/Q6865448","display_name":"Minimum distance","level":2,"score":0.42086061835289},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3286032974720001},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.17622491717338562},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.0798804759979248}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.21437/interspeech.2012-599","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2012-599","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2012","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.303.3088","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.303.3088","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cslu.ogi.edu/~mohammah/seyed-hamidreza-mohammadi-2012-knndist-nonparametric-speaker-segmentation-distance-measure.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.41999998688697815,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W1482605500","https://openalex.org/W1484181928","https://openalex.org/W1876378865","https://openalex.org/W2029687556","https://openalex.org/W2044591814","https://openalex.org/W2104353650","https://openalex.org/W2151299225","https://openalex.org/W2162627003","https://openalex.org/W2166980079"],"related_works":["https://openalex.org/W2990913351","https://openalex.org/W2041294799","https://openalex.org/W2393169369","https://openalex.org/W4320061370","https://openalex.org/W1571567067","https://openalex.org/W1563946824","https://openalex.org/W4294624291","https://openalex.org/W4393210033","https://openalex.org/W4294811698","https://openalex.org/W2768813365"],"abstract_inverted_index":{"A":[0],"novel":[1],"distance":[2,11,19,35,42,48,106,118],"measure":[3,12,43,107],"for":[4,110],"distance-based":[5],"speaker":[6,23,116],"segmentation":[7,24,60],"is":[8,13,44,56,62,83,108],"proposed.":[9,58],"This":[10,41],"nonparametric,":[14],"in":[15,22,53,92],"contrast":[16],"to":[17],"common":[18],"measures":[20],"used":[21],"systems,":[25],"which":[26],"often":[27],"assume":[28],"a":[29,46,90],"Gaussian":[30],"distribution":[31],"when":[32],"measuring":[33],"the":[34,69,105],"between":[36],"1":[37],"two":[38,73],"audio":[39],"segments.":[40],"essentially":[45],"k-nearestneighbor":[47],"measure.":[49],"Non-vowel":[50],"segment":[51],"removal":[52],"preprocessing":[54],"stage":[55],"also":[57],"Speaker":[59],"performance":[61],"tested":[63],"on":[64],"artificially":[65],"created":[66],"conversations":[67],"from":[68],"TIMIT":[70],"database":[71],"and":[72,96],"AMI":[74],"conversations.":[75],"For":[76,86],"short":[77],"window":[78,88,112],"lengths,":[79,89],"Missed":[80,94],"Detection":[81,95],"Rated":[82],"decreased":[84],"significantly.":[85],"moderate":[87],"decrease":[91],"both":[93],"False":[97],"Alarm":[98],"Rates":[99],"occur.":[100],"The":[101],"computational":[102],"cost":[103],"of":[104],"high":[109],"long":[111],"lengths.":[113],"Index":[114],"Terms:":[115],"segmentation,":[117],"measure,":[119],"k-nearest-neighbor":[120]},"counts_by_year":[{"year":2018,"cited_by_count":1},{"year":2014,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
