{"id":"https://openalex.org/W2176067516","doi":"https://doi.org/10.1109/hpcc-css-icess.2015.170","title":"Predicting Scheduling Failures in the Cloud: A Case Study with Google Clusters and Hadoop on Amazon EMR","display_name":"Predicting Scheduling Failures in the Cloud: A Case Study with Google Clusters and Hadoop on Amazon EMR","publication_year":2015,"publication_date":"2015-08-01","ids":{"openalex":"https://openalex.org/W2176067516","doi":"https://doi.org/10.1109/hpcc-css-icess.2015.170","mag":"2176067516"},"language":"en","primary_location":{"id":"doi:10.1109/hpcc-css-icess.2015.170","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpcc-css-icess.2015.170","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE 17th International Conference on High Performance Computing and Communications, 2015 IEEE 7th International Symposium on Cyberspace Safety and Security, and 2015 IEEE 12th International Conference on Embedded Software and Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5060591766","display_name":"Mbarka Soualhia","orcid":"https://orcid.org/0000-0003-3500-6720"},"institutions":[{"id":"https://openalex.org/I60158472","display_name":"Concordia University","ror":"https://ror.org/0420zvk78","country_code":"CA","type":"education","lineage":["https://openalex.org/I60158472"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Mbarka Soualhia","raw_affiliation_strings":["Concordia University"],"affiliations":[{"raw_affiliation_string":"Concordia University","institution_ids":["https://openalex.org/I60158472"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071052367","display_name":"Foutse Khomh","orcid":"https://orcid.org/0000-0002-5704-4173"},"institutions":[{"id":"https://openalex.org/I45683168","display_name":"Polytechnique Montr\u00e9al","ror":"https://ror.org/05f8d4e86","country_code":"CA","type":"education","lineage":["https://openalex.org/I45683168"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Foutse Khomh","raw_affiliation_strings":["Polytechnique Montr\u00e9al, Montr\u00e9al, Quebec, Canada"],"affiliations":[{"raw_affiliation_string":"Polytechnique Montr\u00e9al, Montr\u00e9al, Quebec, Canada","institution_ids":["https://openalex.org/I45683168"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5007159598","display_name":"Sofi\u00e8ne Tahar","orcid":"https://orcid.org/0000-0002-5537-104X"},"institutions":[{"id":"https://openalex.org/I60158472","display_name":"Concordia University","ror":"https://ror.org/0420zvk78","country_code":"CA","type":"education","lineage":["https://openalex.org/I60158472"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Sofiene Tahar","raw_affiliation_strings":["Concordia University"],"affiliations":[{"raw_affiliation_string":"Concordia University","institution_ids":["https://openalex.org/I60158472"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5060591766"],"corresponding_institution_ids":["https://openalex.org/I60158472"],"apc_list":null,"apc_paid":null,"fwci":4.9777,"has_fulltext":false,"cited_by_count":29,"citation_normalized_percentile":{"value":0.95342992,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"58","last_page":"65"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9828000068664551,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.8834206461906433},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8564473390579224},{"id":"https://openalex.org/keywords/turnaround-time","display_name":"Turnaround time","score":0.6813657879829407},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.6309005618095398},{"id":"https://openalex.org/keywords/execution-time","display_name":"Execution time","score":0.5997516512870789},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.5537883043289185},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.5460673570632935},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4713522791862488},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.42473095655441284},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3219665288925171},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.2185879349708557}],"concepts":[{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.8834206461906433},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8564473390579224},{"id":"https://openalex.org/C176553487","wikidata":"https://www.wikidata.org/wiki/Q7855819","display_name":"Turnaround time","level":2,"score":0.6813657879829407},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.6309005618095398},{"id":"https://openalex.org/C2989134064","wikidata":"https://www.wikidata.org/wiki/Q288510","display_name":"Execution time","level":2,"score":0.5997516512870789},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.5537883043289185},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.5460673570632935},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4713522791862488},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.42473095655441284},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3219665288925171},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.2185879349708557},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/hpcc-css-icess.2015.170","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpcc-css-icess.2015.170","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE 17th International Conference on High Performance Computing and Communications, 2015 IEEE 7th International Symposium on Cyberspace Safety and Security, and 2015 IEEE 12th International Conference on Embedded Software and Systems","raw_type":"proceedings-article"},{"id":"pmh:oai:publications.polymtl.ca:35078","is_oa":false,"landing_page_url":"https://publications.polymtl.ca/35078/","pdf_url":null,"source":{"id":"https://openalex.org/S4306401013","display_name":"PolyPublie (\u00c9cole Polytechnique de Montr\u00e9al)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45683168","host_organization_name":"Polytechnique Montr\u00e9al","host_organization_lineage":["https://openalex.org/I45683168"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Communication de conf\u00e9rence"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/8","score":0.4699999988079071,"display_name":"Decent work and economic growth"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W1465342908","https://openalex.org/W1527311855","https://openalex.org/W1646816738","https://openalex.org/W1967903840","https://openalex.org/W2009543464","https://openalex.org/W2028617807","https://openalex.org/W2030826766","https://openalex.org/W2031513172","https://openalex.org/W2031679758","https://openalex.org/W2040615655","https://openalex.org/W2044372531","https://openalex.org/W2062819966","https://openalex.org/W2067417994","https://openalex.org/W2072362295","https://openalex.org/W2088943669","https://openalex.org/W2142262986","https://openalex.org/W2173213060","https://openalex.org/W4243562335","https://openalex.org/W4293857795","https://openalex.org/W6628746613"],"related_works":["https://openalex.org/W1992029172","https://openalex.org/W1975475533","https://openalex.org/W1978877834","https://openalex.org/W2046153241","https://openalex.org/W4309639895","https://openalex.org/W2098247609","https://openalex.org/W2028004384","https://openalex.org/W1497369337","https://openalex.org/W1604247006","https://openalex.org/W2134835513"],"abstract_inverted_index":{"Cloud":[0],"Computing":[1],"has":[2],"emerged":[3],"as":[4,34],"a":[5,124,169,175,211,227],"key":[6],"technology":[7],"to":[8,37,140,172,178,206,260],"deliver":[9],"and":[10,14,44,71,99,174,193,223],"manage":[11],"computing,":[12],"platform,":[13],"software":[15],"services":[16,33],"over":[17],"the":[18,28,39,56,62,66,72,90,105,116,120,142,182,189,199,215,224,242,250],"Internet.":[19],"Task":[20],"scheduling":[21,50,121],"algorithms":[22,51,82],"play":[23],"an":[24,263],"important":[25],"role":[26],"in":[27,55,89],"efficiency":[29],"of":[30,42,69,74,86,108,118,123,145,185,201,218,226,244,252,265],"cloud":[31,59,91],"computing":[32,60],"they":[35,196],"aim":[36],"reduce":[38,141],"turnaround":[40],"time":[41,144],"tasks":[43,70,78,97,134,150,203],"improve":[45,198],"resource":[46,100],"utilization.":[47],"Several":[48],"task":[49,125,166],"have":[52],"been":[53],"proposed":[54],"literature":[57],"for":[58],"systems,":[61],"majority":[63],"relying":[64],"on":[65],"computational":[67],"complexity":[68],"distribution":[73],"resources.":[75],"However,":[76],"several":[77],"scheduled":[79],"following":[80],"these":[81],"still":[83],"fail":[84],"because":[85],"unforeseen":[87],"changes":[88],"environments.":[92],"In":[93],"this":[94],"paper,":[95],"using":[96,126,188,214],"execution":[98,106,143],"utilization":[101],"data":[102],"extracted":[103],"from":[104,233],"traces":[107],"real":[109],"world":[110],"applications":[111],"at":[112],"Google,":[113],"we":[114,130,136],"explore":[115],"possibility":[117],"predicting":[119],"outcome":[122],"statistical":[127,162],"models.":[128],"If":[129],"can":[131,164,197,255],"successfully":[132],"predict":[133,165],"failures,":[135],"may":[137],"be":[138,256],"able":[139],"jobs":[146,225,254],"by":[147,204,258],"rescheduling":[148],"failed":[149,253],"earlier":[151],"(i.e.,":[152],"before":[153],"their":[154],"actual":[155],"failing":[156],"time).":[157],"Our":[158],"results":[159],"show":[160],"that":[161,195,239],"models":[163],"failures":[167],"with":[168,246,262],"precision":[170],"up":[171,177,205,259],"97.4%,":[173],"recall":[176],"96.2%.":[179],"We":[180,208,237],"simulate":[181],"potential":[183],"benefits":[184],"such":[186],"predictions":[187],"tool":[190],"kit":[191],"GloudSim":[192],"found":[194],"number":[200],"finished":[202],"40%.":[207],"also":[209],"perform":[210],"case":[212],"study":[213,232],"Hadoop":[216,245],"framework":[217],"Amazon":[219],"Elastic":[220],"MapReduce":[221],"(EMR)":[222],"gene":[228],"expression":[229],"correlations":[230],"analysis":[231],"breast":[234],"cancer":[235],"research.":[236],"find":[238],"when":[240],"extending":[241],"scheduler":[243],"our":[247],"predictive":[248],"models,":[249],"percentage":[251],"reduced":[257],"45%,":[261],"overhead":[264],"less":[266],"than":[267],"5":[268],"minutes.":[269]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":2},{"year":2015,"cited_by_count":2}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
