{"id":"https://openalex.org/W4224136636","doi":"https://doi.org/10.48550/arxiv.2204.06546","title":"Disentangling Uncertainty in Machine Translation Evaluation","display_name":"Disentangling Uncertainty in Machine Translation Evaluation","publication_year":2022,"publication_date":"2022-04-13","ids":{"openalex":"https://openalex.org/W4224136636","doi":"https://doi.org/10.48550/arxiv.2204.06546"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2204.06546","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2204.06546","pdf_url":"https://arxiv.org/pdf/2204.06546","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2204.06546","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004372721","display_name":"Chrysoula Zerva","orcid":"https://orcid.org/0000-0002-4031-9492"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zerva, Chrysoula","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017626161","display_name":"Taisiya Glushkova","orcid":"https://orcid.org/0000-0003-3521-3834"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Glushkova, Taisiya","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039347839","display_name":"Ricardo Rei","orcid":"https://orcid.org/0000-0001-8265-1939"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rei, Ricardo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5051693368","display_name":"Andr\u00e9 F. T. Martins","orcid":"https://orcid.org/0000-0001-8282-625X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Martins, Andr\u00e9 F. T.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5004372721"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9848999977111816,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9704999923706055,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6979345083236694},{"id":"https://openalex.org/keywords/uncertainty-quantification","display_name":"Uncertainty quantification","score":0.6592406034469604},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.64680016040802},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6063976287841797},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5728852152824402},{"id":"https://openalex.org/keywords/uncertainty-reduction-theory","display_name":"Uncertainty reduction theory","score":0.5156325101852417},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.49401789903640747},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.48925137519836426},{"id":"https://openalex.org/keywords/divergence","display_name":"Divergence (linguistics)","score":0.4760434627532959},{"id":"https://openalex.org/keywords/monte-carlo-method","display_name":"Monte Carlo method","score":0.440281480550766},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.43374955654144287},{"id":"https://openalex.org/keywords/heteroscedasticity","display_name":"Heteroscedasticity","score":0.41594451665878296},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.34869325160980225},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.13981059193611145},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.13227257132530212}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6979345083236694},{"id":"https://openalex.org/C32230216","wikidata":"https://www.wikidata.org/wiki/Q7882499","display_name":"Uncertainty quantification","level":2,"score":0.6592406034469604},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.64680016040802},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6063976287841797},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5728852152824402},{"id":"https://openalex.org/C94361409","wikidata":"https://www.wikidata.org/wiki/Q7882500","display_name":"Uncertainty reduction theory","level":2,"score":0.5156325101852417},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.49401789903640747},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.48925137519836426},{"id":"https://openalex.org/C207390915","wikidata":"https://www.wikidata.org/wiki/Q1230525","display_name":"Divergence (linguistics)","level":2,"score":0.4760434627532959},{"id":"https://openalex.org/C19499675","wikidata":"https://www.wikidata.org/wiki/Q232207","display_name":"Monte Carlo method","level":2,"score":0.440281480550766},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.43374955654144287},{"id":"https://openalex.org/C101104100","wikidata":"https://www.wikidata.org/wiki/Q1063540","display_name":"Heteroscedasticity","level":2,"score":0.41594451665878296},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.34869325160980225},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.13981059193611145},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.13227257132530212},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C46312422","wikidata":"https://www.wikidata.org/wiki/Q11024","display_name":"Communication","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2204.06546","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2204.06546","pdf_url":"https://arxiv.org/pdf/2204.06546","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2204.06546","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2204.06546","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2204.06546","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2204.06546","pdf_url":"https://arxiv.org/pdf/2204.06546","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2224641141","https://openalex.org/W2115703496","https://openalex.org/W2953569485","https://openalex.org/W2797314510","https://openalex.org/W2513379397","https://openalex.org/W3196464345","https://openalex.org/W2149758120","https://openalex.org/W2486383940","https://openalex.org/W171701494","https://openalex.org/W2996869126"],"abstract_inverted_index":{"Trainable":[0],"evaluation":[1],"metrics":[2,148],"for":[3,60,90,116,145],"machine":[4],"translation":[5],"(MT)":[6],"exhibit":[7],"strong":[8],"correlation":[9],"with":[10,37,123,151],"human":[11],"judgements,":[12],"but":[13],"they":[14,62,73,159],"are":[15,54,63,74],"often":[16],"hard":[17],"to":[18,34,65,98,120,166],"interpret":[19],"and":[20,45,72,76,86,93,104,112,133,179],"might":[21],"produce":[22],"unreliable":[23],"scores":[24],"under":[25],"noisy":[26],"or":[27],"out-of-domain":[28,180],"data.":[29,181],"Recent":[30],"work":[31],"has":[32],"attempted":[33],"mitigate":[35],"this":[36,80,108],"simple":[38],"uncertainty":[39,88,125,135,143,169],"quantification":[40],"techniques":[41,50],"(Monte":[42],"Carlo":[43],"dropout":[44],"deep":[46],"ensembles),":[47],"however":[48],"these":[49,164],"(as":[51],"we":[52,82,94,110],"show)":[53],"limited":[55],"in":[56,155,171],"several":[57],"ways":[58],"--":[59],"example,":[61],"unable":[64],"distinguish":[66],"between":[67],"different":[68,100],"kinds":[69],"of":[70,102,163],"uncertainty,":[71],"time":[75],"memory":[77],"consuming.":[78],"In":[79],"paper,":[81],"propose":[83],"more":[84],"powerful":[85],"efficient":[87],"predictors":[89,165],"MT":[91,172],"evaluation,":[92,173],"assess":[95],"their":[96],"ability":[97,162],"target":[99],"sources":[101],"aleatoric":[103],"epistemic":[105],"uncertainty.":[106],"To":[107],"end,":[109],"develop":[111],"compare":[113],"training":[114],"objectives":[115],"the":[117,146,161],"COMET":[118],"metric":[119],"enhance":[121],"it":[122],"an":[124],"prediction":[126,144],"output,":[127],"including":[128],"heteroscedastic":[129],"regression,":[130],"divergence":[131],"minimization,":[132],"direct":[134],"prediction.":[136],"Our":[137],"experiments":[138],"show":[139],"improved":[140],"results":[141],"on":[142],"WMT":[147],"task":[149],"datasets,":[150],"a":[152],"substantial":[153],"reduction":[154],"computational":[156],"costs.":[157],"Moreover,":[158],"demonstrate":[160],"address":[167],"specific":[168],"causes":[170],"such":[174],"as":[175],"low":[176],"quality":[177],"references":[178]},"counts_by_year":[],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2025-10-10T00:00:00"}
