{"id":"https://openalex.org/W2794613042","doi":"https://doi.org/10.1109/dasc-picom-datacom-cyberscitec.2017.204","title":"Building a Semi-Supervised Dataset to Train Journalistic Relevance Detection Models","display_name":"Building a Semi-Supervised Dataset to Train Journalistic Relevance Detection Models","publication_year":2017,"publication_date":"2017-11-01","ids":{"openalex":"https://openalex.org/W2794613042","doi":"https://doi.org/10.1109/dasc-picom-datacom-cyberscitec.2017.204","mag":"2794613042"},"language":"en","primary_location":{"id":"doi:10.1109/dasc-picom-datacom-cyberscitec.2017.204","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dasc-picom-datacom-cyberscitec.2017.204","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE 15th Intl Conf on Dependable, Autonomic and Secure Computing, 15th Intl Conf on Pervasive Intelligence and Computing, 3rd Intl Conf on Big Data Intelligence and Computing and Cyber Science and Technology Congress(DASC/PiCom/DataCom/CyberSciTech)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016762476","display_name":"Nuno Guimar\ufffd\u00e3es","orcid":"https://orcid.org/0000-0003-2854-2891"},"institutions":[{"id":"https://openalex.org/I182534213","display_name":"Universidade do Porto","ror":"https://ror.org/043pwc612","country_code":"PT","type":"education","lineage":["https://openalex.org/I182534213"]}],"countries":["PT"],"is_corresponding":true,"raw_author_name":"Nuno Ricardo Pinheiro da Silva Guimaraes","raw_affiliation_strings":["CRACS, Univ. of Porto, Porto, Portugal"],"affiliations":[{"raw_affiliation_string":"CRACS, Univ. of Porto, Porto, Portugal","institution_ids":["https://openalex.org/I182534213"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5029477501","display_name":"\u00c1lvaro Figueira","orcid":"https://orcid.org/0000-0002-0507-7504"},"institutions":[{"id":"https://openalex.org/I182534213","display_name":"Universidade do Porto","ror":"https://ror.org/043pwc612","country_code":"PT","type":"education","lineage":["https://openalex.org/I182534213"]}],"countries":["PT"],"is_corresponding":false,"raw_author_name":"Alvaro Pedro de Barros Borges Reis Figueira","raw_affiliation_strings":["CRACS, Univ. of Porto, Porto, Portugal"],"affiliations":[{"raw_affiliation_string":"CRACS, Univ. of Porto, Porto, Portugal","institution_ids":["https://openalex.org/I182534213"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5016762476"],"corresponding_institution_ids":["https://openalex.org/I182534213"],"apc_list":null,"apc_paid":null,"fwci":0.39,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.72844517,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"13","issue":null,"first_page":"1271","last_page":"1277"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8516746163368225},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.8332012891769409},{"id":"https://openalex.org/keywords/crowdsourcing","display_name":"Crowdsourcing","score":0.8237757682800293},{"id":"https://openalex.org/keywords/predictability","display_name":"Predictability","score":0.6832711100578308},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.645282506942749},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.5853951573371887},{"id":"https://openalex.org/keywords/scope","display_name":"Scope (computer science)","score":0.5491707921028137},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4597172737121582},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4065064787864685},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.40160438418388367},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.395719438791275},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3434690535068512},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.17304477095603943}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8516746163368225},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.8332012891769409},{"id":"https://openalex.org/C62230096","wikidata":"https://www.wikidata.org/wiki/Q275969","display_name":"Crowdsourcing","level":2,"score":0.8237757682800293},{"id":"https://openalex.org/C197640229","wikidata":"https://www.wikidata.org/wiki/Q2534066","display_name":"Predictability","level":2,"score":0.6832711100578308},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.645282506942749},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.5853951573371887},{"id":"https://openalex.org/C2778012447","wikidata":"https://www.wikidata.org/wiki/Q1034415","display_name":"Scope (computer science)","level":2,"score":0.5491707921028137},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4597172737121582},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4065064787864685},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.40160438418388367},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.395719438791275},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3434690535068512},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.17304477095603943},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/dasc-picom-datacom-cyberscitec.2017.204","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dasc-picom-datacom-cyberscitec.2017.204","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE 15th Intl Conf on Dependable, Autonomic and Secure Computing, 15th Intl Conf on Pervasive Intelligence and Computing, 3rd Intl Conf on Big Data Intelligence and Computing and Cyber Science and Technology Congress(DASC/PiCom/DataCom/CyberSciTech)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320334779","display_name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia","ror":"https://ror.org/00snfqn58"},{"id":"https://openalex.org/F4320335322","display_name":"European Regional Development Fund","ror":"https://ror.org/00k4n6c32"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W980795213","https://openalex.org/W1503130737","https://openalex.org/W1527789501","https://openalex.org/W1614298861","https://openalex.org/W1684832230","https://openalex.org/W1826790618","https://openalex.org/W1987425720","https://openalex.org/W2008285050","https://openalex.org/W2050619059","https://openalex.org/W2052635433","https://openalex.org/W2064178288","https://openalex.org/W2099813784","https://openalex.org/W2111975591","https://openalex.org/W2124060136","https://openalex.org/W2124499489","https://openalex.org/W2132232498","https://openalex.org/W2139188905","https://openalex.org/W2160660844","https://openalex.org/W2162010436","https://openalex.org/W2164124780","https://openalex.org/W2165571577","https://openalex.org/W2168400688","https://openalex.org/W2294703018","https://openalex.org/W2296734373","https://openalex.org/W2331992878","https://openalex.org/W2471350540","https://openalex.org/W2558476596","https://openalex.org/W2596622777","https://openalex.org/W2769002535","https://openalex.org/W3105915590","https://openalex.org/W3122583626","https://openalex.org/W6629970107","https://openalex.org/W6636510571","https://openalex.org/W6637433751","https://openalex.org/W6676744775","https://openalex.org/W6683937847","https://openalex.org/W6684191474","https://openalex.org/W6697146284","https://openalex.org/W6697591862"],"related_works":["https://openalex.org/W3032998312","https://openalex.org/W135177976","https://openalex.org/W4384486036","https://openalex.org/W1503094549","https://openalex.org/W2337920774","https://openalex.org/W4286908577","https://openalex.org/W2886410948","https://openalex.org/W1497983610","https://openalex.org/W1980158193","https://openalex.org/W2917701982"],"abstract_inverted_index":{"Annotated":[0],"data":[1,21],"is":[2,22,65,111,167,188],"one":[3],"of":[4,17,50,57,72,83,104,116,176,217],"the":[5,15,18,54,69,81,101,114,117,125,142,161,174,177,215,218],"most":[6],"important":[7],"components":[8],"for":[9],"supervised":[10],"learning":[11],"tasks.":[12],"To":[13],"ensure":[14],"reliability":[16],"models,":[19,132],"this":[20],"usually":[23],"labeled":[24],"by":[25,191],"several":[26],"human":[27],"annotators":[28],"through":[29,145],"volunteering":[30],"or":[31],"using":[32],"Crowdsourcing":[33],"platforms.":[34],"However,":[35,172],"such":[36],"approaches":[37],"are":[38,182],"unfeasible":[39],"(regarding":[40],"time":[41,207],"and":[42,128,136,155,197,209],"cost)":[43],"in":[44,53,61,119,160],"datasets":[45],"with":[46,80,151],"an":[47,91],"enormous":[48],"number":[49],"entries,":[51],"which":[52,166],"specific":[55,206,210],"case":[56],"journalistic":[58,102],"relevance":[59,86,103,130],"detection":[60,87,131],"social":[62,195],"media":[63],"posts,":[64],"necessary":[66],"due":[67],"to":[68,93,204],"wide":[70],"scope":[71],"topics":[73],"that":[74],"can":[75,213],"be":[76],"considered":[77],"relevant.":[78],"Therefore,":[79],"goal":[82],"building":[84],"a":[85,95,146,205],"model,":[88],"we":[89,123,140],"propose":[90],"architecture":[92],"build":[94,129],"large":[96],"scale":[97],"annotated":[98,149],"dataset":[99,127,150,163,201],"regarding":[100],"Twitter":[105,120],"posts":[106,152],"(i.e.":[107],"tweets).":[108],"This":[109],"methodology":[110],"based":[112],"on":[113],"predictability":[115],"content":[118,192],"accounts.":[121],"Next,":[122],"used":[124],"retrieved":[126],"combining":[133],"text,":[134],"entities,":[135],"sentiment":[137],"features.":[138],"Finally,":[139],"validated":[141],"best":[143],"model":[144,187],"smaller":[147],"manually":[148],"from":[153,170,193],"Facebook":[154],"Twitter.":[156],"The":[157],"F1-measure":[158],"achieved":[159],"validation":[162,178,200],"was":[164,202],"63%":[165],"still":[168],"far":[169],"excellent.":[171],"given":[173],"characteristics":[175],"data,":[179],"these":[180],"results":[181],"encouraging":[183],"since":[184],"1)":[185],"our":[186,199],"not":[189],"affected":[190],"other":[194],"networks":[196],"2)":[198],"restrained":[203],"interval":[208],"keywords":[211],"(which":[212],"affect":[214],"performance":[216],"model).":[219]},"counts_by_year":[{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
