{"id":"https://openalex.org/W4390962726","doi":"https://doi.org/10.48550/arxiv.2401.08138","title":"LLMs for Test Input Generation for Semantic Caches","display_name":"LLMs for Test Input Generation for Semantic Caches","publication_year":2024,"publication_date":"2024-01-16","ids":{"openalex":"https://openalex.org/W4390962726","doi":"https://doi.org/10.48550/arxiv.2401.08138"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2401.08138","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2401.08138","pdf_url":"https://arxiv.org/pdf/2401.08138","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2401.08138","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088904375","display_name":"Zafaryab Rasool","orcid":"https://orcid.org/0000-0002-3603-3125"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Rasool, Zafaryab","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012088137","display_name":"Scott Barnett","orcid":"https://orcid.org/0000-0002-3187-4937"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Barnett, Scott","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014718315","display_name":"David Willie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Willie, David","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080975739","display_name":"Stefanus Kurniawan","orcid":"https://orcid.org/0009-0001-4469-1056"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kurniawan, Stefanus","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093278278","display_name":"Sherwin Balugo","orcid":"https://orcid.org/0009-0001-5619-011X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Balugo, Sherwin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070118830","display_name":"Srikanth Thudumu","orcid":"https://orcid.org/0000-0002-7848-9008"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Thudumu, Srikanth","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5068173669","display_name":"Mohamed Abdelrazek","orcid":"https://orcid.org/0000-0003-3812-9785"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abdelrazek, Mohamed","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5088904375"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.951200008392334,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8746283054351807},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.7237743139266968},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5482649207115173},{"id":"https://openalex.org/keywords/semantic-computing","display_name":"Semantic computing","score":0.5183945298194885},{"id":"https://openalex.org/keywords/semantic-similarity","display_name":"Semantic similarity","score":0.5100679993629456},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4272944927215576},{"id":"https://openalex.org/keywords/semantic-web","display_name":"Semantic Web","score":0.22202172875404358},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.15163442492485046},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.0919128954410553}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8746283054351807},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.7237743139266968},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5482649207115173},{"id":"https://openalex.org/C511149849","wikidata":"https://www.wikidata.org/wiki/Q7449051","display_name":"Semantic computing","level":3,"score":0.5183945298194885},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.5100679993629456},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4272944927215576},{"id":"https://openalex.org/C2129575","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Semantic Web","level":2,"score":0.22202172875404358},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.15163442492485046},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.0919128954410553}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2401.08138","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2401.08138","pdf_url":"https://arxiv.org/pdf/2401.08138","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2401.08138","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2401.08138","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2401.08138","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2401.08138","pdf_url":"https://arxiv.org/pdf/2401.08138","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4390962726.pdf","grobid_xml":"https://content.openalex.org/works/W4390962726.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W1965623300","https://openalex.org/W3134365128","https://openalex.org/W2541135911","https://openalex.org/W2181757899","https://openalex.org/W2359259132","https://openalex.org/W4387489691","https://openalex.org/W2103835134","https://openalex.org/W3016822073","https://openalex.org/W2156467700","https://openalex.org/W2133831373"],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2,26],"(LLMs)":[3],"enable":[4],"state-of-the-art":[5],"semantic":[6,16,49,77,99,109,216,238,261,271],"capabilities":[7,160],"to":[8,11,53,57,72,163,167,174],"be":[9],"added":[10],"software":[12],"systems":[13],"such":[14],"as":[15],"search":[17],"of":[18,34,37,75,90,107,122,161,190,227,236],"unstructured":[19,151],"documents":[20],"and":[21,114,125,176,194,203,206,229,263],"text":[22,152],"generation.":[23],"However,":[24],"these":[25,76],"are":[27,51],"computationally":[28],"expensive.":[29],"At":[30],"scale,":[31],"the":[32,68,73,96,105,158,168,179,188],"cost":[33],"serving":[35],"thousands":[36],"users":[38],"increases":[39],"massively":[40],"affecting":[41],"also":[42,242],"user":[43,93],"experience.":[44],"To":[45],"address":[46],"this":[47,132],"problem,":[48],"caches":[50],"used":[52],"check":[54],"for":[55,139,142,260,266],"answers":[56],"similar":[58,123,148],"queries":[59,124,166,202],"(that":[60],"may":[61],"have":[62],"been":[63],"phrased":[64],"differently)":[65],"without":[66],"hitting":[67],"LLM":[69],"service.":[70],"Due":[71],"nature":[74],"cache":[78,100,110,112],"techniques":[79,101],"that":[80,146,221],"rely":[81],"on":[82,246],"query":[83,222],"embeddings,":[84],"there":[85],"is":[86,128,251],"a":[87,108,118,191,237,270],"high":[88],"chance":[89],"errors":[91],"impacting":[92],"confidence":[94],"in":[95,187],"system.":[97],"Adopting":[98],"usually":[102],"requires":[103,117],"testing":[104],"effectiveness":[106],"(accurate":[111],"hits":[113],"misses)":[115],"which":[116,127],"labelled":[119],"test":[120,143,181,257],"set":[121],"responses":[126],"often":[129],"unavailable.":[130],"In":[131],"paper,":[133],"we":[134,241],"present":[135],"VaryGen,":[136],"an":[137,208,213,252],"approach":[138,156,186,245],"using":[140],"LLMs":[141,162],"input":[144,258],"generation":[145,259],"produces":[147],"questions":[149],"from":[150],"documents.":[153],"Our":[154,218],"novel":[155],"uses":[157],"reasoning":[159],"1)":[164],"adapt":[165],"domain,":[169],"2)":[170],"synthesise":[171],"subtle":[172],"variations":[173],"queries,":[175],"3)":[177],"evaluate":[178,243],"synthesised":[180],"dataset.":[182,248],"We":[183],"evaluated":[184],"our":[185,230,244],"domain":[189],"student":[192],"question":[193],"answer":[195],"system":[196],"by":[197],"qualitatively":[198],"analysing":[199],"100":[200],"generated":[201,231],"result":[204],"pairs,":[205],"conducting":[207],"empirical":[209],"case":[210],"study":[211],"with":[212],"open":[214],"source":[215],"cache.":[217,239,272],"results":[219],"show":[220],"pairs":[223],"satisfy":[224],"human":[225],"expectations":[226],"similarity":[228],"data":[232],"demonstrates":[233],"failure":[234],"cases":[235],"Additionally,":[240],"Qasper":[247],"This":[249],"work":[250],"important":[253],"first":[254],"step":[255],"into":[256],"applications":[262],"presents":[264],"considerations":[265],"practitioners":[267],"when":[268],"calibrating":[269]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-13T16:22:10.518609","created_date":"2025-10-10T00:00:00"}
