1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761777177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005200620072008200920102011201220132014201520162017201820192020202120222023202420252026202720282029203020312032203320342035203620372038203920402041204220432044204520462047204820492050205120522053205420552056205720582059206020612062206320642065206620672068206920702071207220732074207520762077207820792080208120822083208420852086208720882089209020912092209320942095209620972098209921002101210221032104210521062107210821092110211121122113211421152116211721182119212021212122212321242125212621272128212921302131213221332134213521362137213821392140214121422143214421452146214721482149215021512152215321542155215621572158215921602161216221632164216521662167216821692170217121722173217421752176217721782179218021812182218321842185218621872188218921902191219221932194219521962197219821992200220122022203220422052206220722082209221022112212221322142215221622172218221922202221222222232224222522262227222822292230223122322233223422352236223722382239224022412242224322442245224622472248224922502251225222532254225522562257225822592260226122622263226422652266226722682269227022712272227322742275227622772278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277727782779278027812782278327842785278627872788278927902791279227932794279527962797279827992800280128022803280428052806280728082809281028112812281328142815281628172818281928202821282228232824282528262827282828292830283128322833283428352836283728382839284028412842284328442845284628472848284928502851285228532854285528562857285828592860286128622863286428652866286728682869287028712872287328742875287628772878287928802881288228832884288528862887288828892890289128922893289428952896289728982899290029012902290329042905290629072908290929102911291229132914291529162917291829192920292129222923292429252926292729282929293029312932293329342935293629372938293929402941294229432944294529462947294829492950295129522953295429552956295729582959296029612962296329642965296629672968296929702971297229732974297529762977297829792980298129822983298429852986298729882989299029912992299329942995299629972998299930003001300230033004300530063007300830093010301130123013301430153016301730183019302030213022302330243025302630273028302930303031303230333034303530363037303830393040304130423043304430453046304730483049305030513052305330543055305630573058305930603061306230633064306530663067306830693070307130723073307430753076307730783079308030813082308330843085308630873088308930903091309230933094309530963097309830993100310131023103310431053106310731083109311031113112311331143115311631173118311931203121312231233124312531263127312831293130313131323133313431353136313731383139314031413142314331443145314631473148314931503151315231533154315531563157315831593160316131623163316431653166316731683169317031713172317331743175317631773178317931803181318231833184318531863187318831893190319131923193319431953196319731983199320032013202320332043205320632073208320932103211321232133214321532163217321832193220322132223223322432253226322732283229323032313232323332343235323632373238323932403241324232433244324532463247324832493250325132523253325432553256325732583259326032613262326332643265326632673268326932703271327232733274327532763277327832793280328132823283328432853286328732883289329032913292329332943295329632973298329933003301330233033304330533063307330833093310331133123313331433153316331733183319332033213322332333243325332633273328332933303331333233333334333533363337333833393340334133423343334433453346334733483349335033513352335333543355335633573358335933603361336233633364336533663367336833693370337133723373337433753376337733783379338033813382338333843385338633873388338933903391339233933394339533963397339833993400340134023403340434053406340734083409341034113412341334143415341634173418341934203421342234233424342534263427342834293430343134323433343434353436343734383439344034413442344334443445344634473448344934503451345234533454345534563457345834593460346134623463346434653466346734683469347034713472347334743475347634773478347934803481348234833484348534863487348834893490349134923493349434953496349734983499350035013502350335043505350635073508350935103511351235133514351535163517351835193520352135223523352435253526352735283529353035313532353335343535353635373538353935403541354235433544354535463547354835493550355135523553355435553556355735583559356035613562356335643565356635673568356935703571357235733574357535763577357835793580358135823583358435853586358735883589359035913592359335943595359635973598359936003601360236033604360536063607360836093610361136123613361436153616361736183619362036213622362336243625362636273628362936303631363236333634363536363637363836393640364136423643364436453646364736483649365036513652365336543655365636573658365936603661366236633664366536663667366836693670367136723673367436753676367736783679368036813682368336843685368636873688368936903691369236933694369536963697369836993700370137023703370437053706370737083709371037113712371337143715371637173718371937203721372237233724372537263727372837293730373137323733373437353736373737383739374037413742374337443745374637473748374937503751375237533754375537563757375837593760376137623763376437653766376737683769377037713772377337743775377637773778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883388438853886388738883889389038913892389338943895389638973898389939003901390239033904390539063907390839093910391139123913391439153916391739183919392039213922392339243925392639273928392939303931393239333934393539363937393839393940394139423943394439453946394739483949395039513952395339543955395639573958395939603961396239633964396539663967396839693970397139723973397439753976397739783979398039813982398339843985398639873988398939903991399239933994399539963997399839994000400140024003400440054006400740084009401040114012401340144015401640174018401940204021402240234024402540264027402840294030403140324033403440354036403740384039404040414042404340444045404640474048404940504051405240534054405540564057405840594060406140624063406440654066406740684069407040714072407340744075407640774078407940804081408240834084408540864087408840894090409140924093409440954096409740984099410041014102410341044105410641074108410941104111411241134114411541164117411841194120412141224123412441254126412741284129413041314132413341344135413641374138413941404141414241434144414541464147414841494150415141524153415441554156415741584159416041614162416341644165416641674168416941704171417241734174417541764177417841794180418141824183418441854186418741884189419041914192419341944195419641974198419942004201420242034204420542064207420842094210421142124213421442154216421742184219422042214222422342244225422642274228422942304231423242334234423542364237423842394240424142424243424442454246424742484249425042514252425342544255425642574258425942604261426242634264426542664267426842694270427142724273427442754276427742784279428042814282428342844285428642874288428942904291429242934294429542964297429842994300430143024303430443054306430743084309431043114312431343144315431643174318431943204321432243234324432543264327432843294330433143324333433443354336433743384339434043414342434343444345434643474348434943504351435243534354435543564357435843594360436143624363436443654366436743684369437043714372437343744375437643774378437943804381438243834384438543864387438843894390439143924393439443954396439743984399440044014402440344044405440644074408440944104411441244134414441544164417441844194420442144224423442444254426442744284429443044314432443344344435443644374438443944404441444244434444444544464447444844494450445144524453445444554456445744584459446044614462446344644465446644674468446944704471447244734474447544764477447844794480448144824483448444854486448744884489449044914492449344944495449644974498449945004501450245034504450545064507450845094510451145124513451445154516451745184519452045214522452345244525452645274528452945304531453245334534453545364537453845394540454145424543454445454546454745484549455045514552455345544555455645574558455945604561456245634564456545664567456845694570457145724573457445754576457745784579458045814582458345844585458645874588458945904591459245934594459545964597459845994600460146024603460446054606460746084609461046114612461346144615461646174618461946204621462246234624462546264627462846294630463146324633463446354636463746384639464046414642464346444645464646474648464946504651465246534654465546564657465846594660466146624663466446654666466746684669467046714672467346744675467646774678467946804681468246834684468546864687468846894690469146924693469446954696469746984699470047014702470347044705470647074708470947104711471247134714471547164717471847194720472147224723472447254726472747284729473047314732473347344735473647374738473947404741474247434744474547464747474847494750475147524753475447554756475747584759476047614762476347644765476647674768476947704771477247734774477547764777477847794780478147824783478447854786478747884789479047914792479347944795479647974798479948004801480248034804480548064807480848094810481148124813481448154816481748184819482048214822482348244825482648274828482948304831483248334834483548364837483848394840484148424843484448454846484748484849485048514852485348544855485648574858485948604861486248634864486548664867486848694870487148724873487448754876487748784879488048814882488348844885488648874888488948904891489248934894489548964897489848994900490149024903490449054906490749084909491049114912491349144915491649174918491949204921492249234924492549264927492849294930493149324933493449354936493749384939494049414942494349444945494649474948494949504951495249534954495549564957495849594960496149624963496449654966496749684969497049714972497349744975497649774978497949804981498249834984498549864987498849894990499149924993499449954996499749984999500050015002500350045005500650075008500950105011501250135014501550165017501850195020502150225023502450255026502750285029503050315032503350345035503650375038503950405041504250435044504550465047504850495050505150525053505450555056505750585059506050615062506350645065506650675068506950705071507250735074507550765077507850795080508150825083508450855086508750885089509050915092509350945095509650975098509951005101510251035104510551065107510851095110511151125113511451155116511751185119512051215122512351245125512651275128512951305131513251335134513551365137513851395140514151425143514451455146514751485149515051515152515351545155515651575158515951605161516251635164516551665167516851695170517151725173517451755176517751785179518051815182518351845185518651875188518951905191519251935194519551965197519851995200520152025203520452055206520752085209521052115212521352145215521652175218521952205221522252235224522552265227522852295230523152325233523452355236523752385239524052415242524352445245524652475248524952505251525252535254525552565257525852595260526152625263526452655266526752685269527052715272527352745275527652775278527952805281528252835284528552865287528852895290529152925293529452955296529752985299530053015302530353045305530653075308530953105311531253135314531553165317531853195320532153225323532453255326532753285329533053315332533353345335533653375338533953405341534253435344534553465347534853495350535153525353535453555356535753585359536053615362536353645365536653675368536953705371537253735374537553765377537853795380538153825383538453855386538753885389539053915392539353945395539653975398539954005401540254035404540554065407540854095410541154125413541454155416541754185419542054215422542354245425542654275428542954305431543254335434543554365437543854395440544154425443544454455446544754485449545054515452545354545455545654575458545954605461546254635464546554665467546854695470547154725473547454755476547754785479548054815482548354845485548654875488548954905491549254935494549554965497549854995500550155025503550455055506550755085509551055115512551355145515551655175518551955205521552255235524552555265527552855295530553155325533553455355536553755385539554055415542554355445545554655475548554955505551555255535554555555565557555855595560556155625563556455655566556755685569557055715572557355745575557655775578557955805581558255835584558555865587558855895590559155925593559455955596559755985599560056015602560356045605560656075608560956105611561256135614561556165617561856195620562156225623562456255626562756285629563056315632563356345635563656375638563956405641564256435644564556465647564856495650565156525653565456555656565756585659566056615662566356645665566656675668566956705671567256735674567556765677567856795680568156825683568456855686568756885689569056915692569356945695569656975698569957005701570257035704570557065707570857095710571157125713571457155716571757185719572057215722572357245725572657275728572957305731573257335734573557365737573857395740574157425743574457455746574757485749575057515752575357545755575657575758575957605761576257635764576557665767576857695770577157725773577457755776577757785779578057815782578357845785578657875788578957905791579257935794579557965797579857995800580158025803580458055806580758085809581058115812 |
- <!doctype html>
- <html lang="en" class="no-js">
- <head>
-
- <meta charset="utf-8">
- <meta name="viewport" content="width=device-width,initial-scale=1">
-
-
-
-
- <link rel="prev" href="../">
-
-
- <link rel="next" href="../models/">
-
-
- <link rel="icon" href="../../assets/images/favicon.png">
- <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.40">
-
-
-
- <title>Agent - SWE-agent documentation</title>
-
-
-
- <link rel="stylesheet" href="../../assets/stylesheets/main.8c3ca2c6.min.css">
-
-
- <link rel="stylesheet" href="../../assets/stylesheets/palette.06af60db.min.css">
-
-
-
-
-
-
-
-
-
-
- <link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
- <link rel="stylesheet" href="https://fonts.googleapis.com/css?family=Roboto:300,300i,400,400i,700,700i%7CRoboto+Mono:400,400i,700,700i&display=fallback">
- <style>:root{--md-text-font:"Roboto";--md-code-font:"Roboto Mono"}</style>
-
-
-
- <link rel="stylesheet" href="../../assets/_mkdocstrings.css">
-
- <link rel="stylesheet" href="../../assets/custom.css">
-
- <script>__md_scope=new URL("../..",location),__md_hash=e=>[...e].reduce(((e,_)=>(e<<5)-e+_.charCodeAt(0)),0),__md_get=(e,_=localStorage,t=__md_scope)=>JSON.parse(_.getItem(t.pathname+"."+e)),__md_set=(e,_,t=localStorage,a=__md_scope)=>{try{t.setItem(a.pathname+"."+e,JSON.stringify(_))}catch(e){}}</script>
-
-
-
-
-
- <link href="../../assets/stylesheets/glightbox.min.css" rel="stylesheet"/><style>
- html.glightbox-open { overflow: initial; height: 100%; }
- .gslide-title { margin-top: 0px; user-select: text; }
- .gslide-desc { color: #666; user-select: text; }
- .gslide-image img { background: white; }
- .gscrollbar-fixer { padding-right: 15px; }
- .gdesc-inner { font-size: 0.75rem; }
- body[data-md-color-scheme="slate"] .gdesc-inner { background: var(--md-default-bg-color);}
- body[data-md-color-scheme="slate"] .gslide-title { color: var(--md-default-fg-color);}
- body[data-md-color-scheme="slate"] .gslide-desc { color: var(--md-default-fg-color);}</style> <script src="../../assets/javascripts/glightbox.min.js"></script></head>
-
-
-
-
-
-
-
-
-
- <body dir="ltr" data-md-color-scheme="default" data-md-color-primary="indigo" data-md-color-accent="indigo">
-
-
- <input class="md-toggle" data-md-toggle="drawer" type="checkbox" id="__drawer" autocomplete="off">
- <input class="md-toggle" data-md-toggle="search" type="checkbox" id="__search" autocomplete="off">
- <label class="md-overlay" for="__drawer"></label>
- <div data-md-component="skip">
-
-
- <a href="#the-agent-class" class="md-skip">
- Skip to content
- </a>
-
- </div>
- <div data-md-component="announce">
-
- <aside class="md-banner">
- <div class="md-banner__inner md-grid md-typeset">
-
- <button class="md-banner__button md-icon" aria-label="Don't show this again">
-
- <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M19 6.41 17.59 5 12 10.59 6.41 5 5 6.41 10.59 12 5 17.59 6.41 19 12 13.41 17.59 19 19 17.59 13.41 12z"/></svg>
- </button>
-
-
- <!-- This link won't work in local preview -->
- <a href="SWE-agent/background#enigma" class="clickable-banner">
- <div>
- News: SWE-agent <span class="enigma">EniGMA</span> solves cybersecurity and CTF challanges to achieve <span class="enigma">3x improvement over previous SOTA!</span>
- </div>
- </a>
- </div>
-
- <script>var el=document.querySelector("[data-md-component=announce]");if(el){var content=el.querySelector(".md-typeset");__md_hash(content.innerHTML)===__md_get("__announce")&&(el.hidden=!0)}</script>
-
- </aside>
-
- </div>
-
-
-
-
- <header class="md-header md-header--shadow" data-md-component="header">
- <nav class="md-header__inner md-grid" aria-label="Header">
- <a href="../.." title="SWE-agent documentation" class="md-header__button md-logo" aria-label="SWE-agent documentation" data-md-component="logo">
-
- <img src="../../assets/swe-agent.svg" alt="logo">
- </a>
- <label class="md-header__button md-icon" for="__drawer">
-
- <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M3 6h18v2H3zm0 5h18v2H3zm0 5h18v2H3z"/></svg>
- </label>
- <div class="md-header__title" data-md-component="header-title">
- <div class="md-header__ellipsis">
- <div class="md-header__topic">
- <span class="md-ellipsis">
- SWE-agent documentation
- </span>
- </div>
- <div class="md-header__topic" data-md-component="header-topic">
- <span class="md-ellipsis">
-
- Agent
-
- </span>
- </div>
- </div>
- </div>
-
-
- <form class="md-header__option" data-md-component="palette">
-
-
-
-
- <input class="md-option" data-md-color-media="(prefers-color-scheme)" data-md-color-scheme="default" data-md-color-primary="indigo" data-md-color-accent="indigo" aria-label="Switch to light mode" type="radio" name="__palette" id="__palette_0">
-
- <label class="md-header__button md-icon" title="Switch to light mode" for="__palette_1" hidden>
- <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="m14.3 16-.7-2h-3.2l-.7 2H7.8L11 7h2l3.2 9zM20 8.69V4h-4.69L12 .69 8.69 4H4v4.69L.69 12 4 15.31V20h4.69L12 23.31 15.31 20H20v-4.69L23.31 12zm-9.15 3.96h2.3L12 9z"/></svg>
- </label>
-
-
-
-
-
- <input class="md-option" data-md-color-media="(prefers-color-scheme: light)" data-md-color-scheme="default" data-md-color-primary="black" data-md-color-accent="deep-orange" aria-label="Switch to dark mode" type="radio" name="__palette" id="__palette_1">
-
- <label class="md-header__button md-icon" title="Switch to dark mode" for="__palette_2" hidden>
- <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="m17.75 4.09-2.53 1.94.91 3.06-2.63-1.81-2.63 1.81.91-3.06-2.53-1.94L12.44 4l1.06-3 1.06 3zm3.5 6.91-1.64 1.25.59 1.98-1.7-1.17-1.7 1.17.59-1.98L15.75 11l2.06-.05L18.5 9l.69 1.95zm-2.28 4.95c.83-.08 1.72 1.1 1.19 1.85-.32.45-.66.87-1.08 1.27C15.17 23 8.84 23 4.94 19.07c-3.91-3.9-3.91-10.24 0-14.14.4-.4.82-.76 1.27-1.08.75-.53 1.93.36 1.85 1.19-.27 2.86.69 5.83 2.89 8.02a9.96 9.96 0 0 0 8.02 2.89m-1.64 2.02a12.08 12.08 0 0 1-7.8-3.47c-2.17-2.19-3.33-5-3.49-7.82-2.81 3.14-2.7 7.96.31 10.98 3.02 3.01 7.84 3.12 10.98.31"/></svg>
- </label>
-
-
-
-
-
- <input class="md-option" data-md-color-media="(prefers-color-scheme: dark)" data-md-color-scheme="slate" data-md-color-primary="black" data-md-color-accent="deep-orange" aria-label="Switch to light mode" type="radio" name="__palette" id="__palette_2">
-
- <label class="md-header__button md-icon" title="Switch to light mode" for="__palette_0" hidden>
- <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M12 7a5 5 0 0 1 5 5 5 5 0 0 1-5 5 5 5 0 0 1-5-5 5 5 0 0 1 5-5m0 2a3 3 0 0 0-3 3 3 3 0 0 0 3 3 3 3 0 0 0 3-3 3 3 0 0 0-3-3m0-7 2.39 3.42C13.65 5.15 12.84 5 12 5s-1.65.15-2.39.42zM3.34 7l4.16-.35A7.2 7.2 0 0 0 5.94 8.5c-.44.74-.69 1.5-.83 2.29zm.02 10 1.76-3.77a7.131 7.131 0 0 0 2.38 4.14zM20.65 7l-1.77 3.79a7.02 7.02 0 0 0-2.38-4.15zm-.01 10-4.14.36c.59-.51 1.12-1.14 1.54-1.86.42-.73.69-1.5.83-2.29zM12 22l-2.41-3.44c.74.27 1.55.44 2.41.44.82 0 1.63-.17 2.37-.44z"/></svg>
- </label>
-
-
- </form>
-
-
-
- <script>var palette=__md_get("__palette");if(palette&&palette.color){if("(prefers-color-scheme)"===palette.color.media){var media=matchMedia("(prefers-color-scheme: light)"),input=document.querySelector(media.matches?"[data-md-color-media='(prefers-color-scheme: light)']":"[data-md-color-media='(prefers-color-scheme: dark)']");palette.color.media=input.getAttribute("data-md-color-media"),palette.color.scheme=input.getAttribute("data-md-color-scheme"),palette.color.primary=input.getAttribute("data-md-color-primary"),palette.color.accent=input.getAttribute("data-md-color-accent")}for(var[key,value]of Object.entries(palette.color))document.body.setAttribute("data-md-color-"+key,value)}</script>
-
-
-
- <label class="md-header__button md-icon" for="__search">
-
- <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M9.5 3A6.5 6.5 0 0 1 16 9.5c0 1.61-.59 3.09-1.56 4.23l.27.27h.79l5 5-1.5 1.5-5-5v-.79l-.27-.27A6.52 6.52 0 0 1 9.5 16 6.5 6.5 0 0 1 3 9.5 6.5 6.5 0 0 1 9.5 3m0 2C7 5 5 7 5 9.5S7 14 9.5 14 14 12 14 9.5 12 5 9.5 5"/></svg>
- </label>
- <div class="md-search" data-md-component="search" role="dialog">
- <label class="md-search__overlay" for="__search"></label>
- <div class="md-search__inner" role="search">
- <form class="md-search__form" name="search">
- <input type="text" class="md-search__input" name="query" aria-label="Search" placeholder="Search" autocapitalize="off" autocorrect="off" autocomplete="off" spellcheck="false" data-md-component="search-query" required>
- <label class="md-search__icon md-icon" for="__search">
-
- <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M9.5 3A6.5 6.5 0 0 1 16 9.5c0 1.61-.59 3.09-1.56 4.23l.27.27h.79l5 5-1.5 1.5-5-5v-.79l-.27-.27A6.52 6.52 0 0 1 9.5 16 6.5 6.5 0 0 1 3 9.5 6.5 6.5 0 0 1 9.5 3m0 2C7 5 5 7 5 9.5S7 14 9.5 14 14 12 14 9.5 12 5 9.5 5"/></svg>
-
- <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M20 11v2H8l5.5 5.5-1.42 1.42L4.16 12l7.92-7.92L13.5 5.5 8 11z"/></svg>
- </label>
- <nav class="md-search__options" aria-label="Search">
-
- <button type="reset" class="md-search__icon md-icon" title="Clear" aria-label="Clear" tabindex="-1">
-
- <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M19 6.41 17.59 5 12 10.59 6.41 5 5 6.41 10.59 12 5 17.59 6.41 19 12 13.41 17.59 19 19 17.59 13.41 12z"/></svg>
- </button>
- </nav>
-
- </form>
- <div class="md-search__output">
- <div class="md-search__scrollwrap" tabindex="0" data-md-scrollfix>
- <div class="md-search-result" data-md-component="search-result">
- <div class="md-search-result__meta">
- Initializing search
- </div>
- <ol class="md-search-result__list" role="presentation"></ol>
- </div>
- </div>
- </div>
- </div>
- </div>
-
-
- <div class="md-header__source">
- <a href="https://github.com/princeton-nlp/SWE-agent" title="Go to repository" class="md-source" data-md-component="source">
- <div class="md-source__icon md-icon">
-
- <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 496 512"><!--! Font Awesome Free 6.6.0 by @fontawesome - https://fontawesome.com License - https://fontawesome.com/license/free (Icons: CC BY 4.0, Fonts: SIL OFL 1.1, Code: MIT License) Copyright 2024 Fonticons, Inc.--><path d="M165.9 397.4c0 2-2.3 3.6-5.2 3.6-3.3.3-5.6-1.3-5.6-3.6 0-2 2.3-3.6 5.2-3.6 3-.3 5.6 1.3 5.6 3.6m-31.1-4.5c-.7 2 1.3 4.3 4.3 4.9 2.6 1 5.6 0 6.2-2s-1.3-4.3-4.3-5.2c-2.6-.7-5.5.3-6.2 2.3m44.2-1.7c-2.9.7-4.9 2.6-4.6 4.9.3 2 2.9 3.3 5.9 2.6 2.9-.7 4.9-2.6 4.6-4.6-.3-1.9-3-3.2-5.9-2.9M244.8 8C106.1 8 0 113.3 0 252c0 110.9 69.8 205.8 169.5 239.2 12.8 2.3 17.3-5.6 17.3-12.1 0-6.2-.3-40.4-.3-61.4 0 0-70 15-84.7-29.8 0 0-11.4-29.1-27.8-36.6 0 0-22.9-15.7 1.6-15.4 0 0 24.9 2 38.6 25.8 21.9 38.6 58.6 27.5 72.9 20.9 2.3-16 8.8-27.1 16-33.7-55.9-6.2-112.3-14.3-112.3-110.5 0-27.5 7.6-41.3 23.6-58.9-2.6-6.5-11.1-33.3 2.6-67.9 20.9-6.5 69 27 69 27 20-5.6 41.5-8.5 62.8-8.5s42.8 2.9 62.8 8.5c0 0 48.1-33.6 69-27 13.7 34.7 5.2 61.4 2.6 67.9 16 17.7 25.8 31.5 25.8 58.9 0 96.5-58.9 104.2-114.8 110.5 9.2 7.9 17 22.9 17 46.4 0 33.7-.3 75.4-.3 83.6 0 6.5 4.6 14.4 17.3 12.1C428.2 457.8 496 362.9 496 252 496 113.3 383.5 8 244.8 8M97.2 352.9c-1.3 1-1 3.3.7 5.2 1.6 1.6 3.9 2.3 5.2 1 1.3-1 1-3.3-.7-5.2-1.6-1.6-3.9-2.3-5.2-1m-10.8-8.1c-.7 1.3.3 2.9 2.3 3.9 1.6 1 3.6.7 4.3-.7.7-1.3-.3-2.9-2.3-3.9-2-.6-3.6-.3-4.3.7m32.4 35.6c-1.6 1.3-1 4.3 1.3 6.2 2.3 2.3 5.2 2.6 6.5 1 1.3-1.3.7-4.3-1.3-6.2-2.2-2.3-5.2-2.6-6.5-1m-11.4-14.7c-1.6 1-1.6 3.6 0 5.9s4.3 3.3 5.6 2.3c1.6-1.3 1.6-3.9 0-6.2-1.4-2.3-4-3.3-5.6-2"/></svg>
- </div>
- <div class="md-source__repository">
- princeton-nlp/SWE-agent
- </div>
- </a>
- </div>
-
- </nav>
-
- </header>
-
- <div class="md-container" data-md-component="container">
-
-
-
-
-
-
- <main class="md-main" data-md-component="main">
- <div class="md-main__inner md-grid">
-
-
-
- <div class="md-sidebar md-sidebar--primary" data-md-component="sidebar" data-md-type="navigation" >
- <div class="md-sidebar__scrollwrap">
- <div class="md-sidebar__inner">
-
- <nav class="md-nav md-nav--primary" aria-label="Navigation" data-md-level="0">
- <label class="md-nav__title" for="__drawer">
- <a href="../.." title="SWE-agent documentation" class="md-nav__button md-logo" aria-label="SWE-agent documentation" data-md-component="logo">
-
- <img src="../../assets/swe-agent.svg" alt="logo">
- </a>
- SWE-agent documentation
- </label>
-
- <div class="md-nav__source">
- <a href="https://github.com/princeton-nlp/SWE-agent" title="Go to repository" class="md-source" data-md-component="source">
- <div class="md-source__icon md-icon">
-
- <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 496 512"><!--! Font Awesome Free 6.6.0 by @fontawesome - https://fontawesome.com License - https://fontawesome.com/license/free (Icons: CC BY 4.0, Fonts: SIL OFL 1.1, Code: MIT License) Copyright 2024 Fonticons, Inc.--><path d="M165.9 397.4c0 2-2.3 3.6-5.2 3.6-3.3.3-5.6-1.3-5.6-3.6 0-2 2.3-3.6 5.2-3.6 3-.3 5.6 1.3 5.6 3.6m-31.1-4.5c-.7 2 1.3 4.3 4.3 4.9 2.6 1 5.6 0 6.2-2s-1.3-4.3-4.3-5.2c-2.6-.7-5.5.3-6.2 2.3m44.2-1.7c-2.9.7-4.9 2.6-4.6 4.9.3 2 2.9 3.3 5.9 2.6 2.9-.7 4.9-2.6 4.6-4.6-.3-1.9-3-3.2-5.9-2.9M244.8 8C106.1 8 0 113.3 0 252c0 110.9 69.8 205.8 169.5 239.2 12.8 2.3 17.3-5.6 17.3-12.1 0-6.2-.3-40.4-.3-61.4 0 0-70 15-84.7-29.8 0 0-11.4-29.1-27.8-36.6 0 0-22.9-15.7 1.6-15.4 0 0 24.9 2 38.6 25.8 21.9 38.6 58.6 27.5 72.9 20.9 2.3-16 8.8-27.1 16-33.7-55.9-6.2-112.3-14.3-112.3-110.5 0-27.5 7.6-41.3 23.6-58.9-2.6-6.5-11.1-33.3 2.6-67.9 20.9-6.5 69 27 69 27 20-5.6 41.5-8.5 62.8-8.5s42.8 2.9 62.8 8.5c0 0 48.1-33.6 69-27 13.7 34.7 5.2 61.4 2.6 67.9 16 17.7 25.8 31.5 25.8 58.9 0 96.5-58.9 104.2-114.8 110.5 9.2 7.9 17 22.9 17 46.4 0 33.7-.3 75.4-.3 83.6 0 6.5 4.6 14.4 17.3 12.1C428.2 457.8 496 362.9 496 252 496 113.3 383.5 8 244.8 8M97.2 352.9c-1.3 1-1 3.3.7 5.2 1.6 1.6 3.9 2.3 5.2 1 1.3-1 1-3.3-.7-5.2-1.6-1.6-3.9-2.3-5.2-1m-10.8-8.1c-.7 1.3.3 2.9 2.3 3.9 1.6 1 3.6.7 4.3-.7.7-1.3-.3-2.9-2.3-3.9-2-.6-3.6-.3-4.3.7m32.4 35.6c-1.6 1.3-1 4.3 1.3 6.2 2.3 2.3 5.2 2.6 6.5 1 1.3-1.3.7-4.3-1.3-6.2-2.2-2.3-5.2-2.6-6.5-1m-11.4-14.7c-1.6 1-1.6 3.6 0 5.9s4.3 3.3 5.6 2.3c1.6-1.3 1.6-3.9 0-6.2-1.4-2.3-4-3.3-5.6-2"/></svg>
- </div>
- <div class="md-source__repository">
- princeton-nlp/SWE-agent
- </div>
- </a>
- </div>
-
- <ul class="md-nav__list" data-md-scrollfix>
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../.." class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Home
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item md-nav__item--nested">
-
-
-
- <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_2" >
-
-
-
- <div class="md-nav__link md-nav__container">
- <a href="../../background/" class="md-nav__link ">
-
-
- <span class="md-ellipsis">
- Project Overview
- </span>
-
- </a>
-
-
- <label class="md-nav__link " for="__nav_2" id="__nav_2_label" tabindex="0">
- <span class="md-nav__icon md-icon"></span>
- </label>
-
- </div>
-
- <nav class="md-nav" data-md-level="1" aria-labelledby="__nav_2_label" aria-expanded="false">
- <label class="md-nav__title" for="__nav_2">
- <span class="md-nav__icon md-icon"></span>
- Project Overview
- </label>
- <ul class="md-nav__list" data-md-scrollfix>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../background/aci/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Agent-Computer Interface
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../background/iat/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Interactive Agent Tools
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../background/architecture/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Architecture
- </span>
-
- </a>
- </li>
-
-
-
- </ul>
- </nav>
-
- </li>
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item md-nav__item--nested">
-
-
-
- <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_3" >
-
-
-
- <div class="md-nav__link md-nav__container">
- <a href="../../installation/" class="md-nav__link ">
-
-
- <span class="md-ellipsis">
- Installation
- </span>
-
- </a>
-
-
- <label class="md-nav__link " for="__nav_3" id="__nav_3_label" tabindex="0">
- <span class="md-nav__icon md-icon"></span>
- </label>
-
- </div>
-
- <nav class="md-nav" data-md-level="1" aria-labelledby="__nav_3_label" aria-expanded="false">
- <label class="md-nav__title" for="__nav_3">
- <span class="md-nav__icon md-icon"></span>
- Installation
- </label>
- <ul class="md-nav__list" data-md-scrollfix>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../installation/codespaces/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Use in-browser
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../installation/source/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Install from source
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../installation/docker/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Run with docker
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../installation/keys/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- API keys
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../installation/tips/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Installation tips
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../installation/changelog/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Changelog
- </span>
-
- </a>
- </li>
-
-
-
- </ul>
- </nav>
-
- </li>
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item md-nav__item--nested">
-
-
-
- <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_4" >
-
-
-
- <div class="md-nav__link md-nav__container">
- <a href="../../usage/" class="md-nav__link ">
-
-
- <span class="md-ellipsis">
- Usage
- </span>
-
- </a>
-
-
- <label class="md-nav__link " for="__nav_4" id="__nav_4_label" tabindex="0">
- <span class="md-nav__icon md-icon"></span>
- </label>
-
- </div>
-
- <nav class="md-nav" data-md-level="1" aria-labelledby="__nav_4_label" aria-expanded="false">
- <label class="md-nav__title" for="__nav_4">
- <span class="md-nav__icon md-icon"></span>
- Usage
- </label>
- <ul class="md-nav__list" data-md-scrollfix>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../usage/cl_tutorial/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Command line usage
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../usage/enigma/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- EnIGMA usage
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../usage/coding_challenges/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Solving coding challenges
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../usage/web_ui/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Using the web UI
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../usage/trajectories/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Trajectories
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../usage/inspector/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Trajectory inspector
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../usage/usage_faq/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- FAQ
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../usage/benchmarking/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Benchmarking
- </span>
-
- </a>
- </li>
-
-
-
- </ul>
- </nav>
-
- </li>
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item md-nav__item--nested">
-
-
-
- <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_5" >
-
-
- <label class="md-nav__link" for="__nav_5" id="__nav_5_label" tabindex="0">
-
-
- <span class="md-ellipsis">
- Configuration
- </span>
-
- <span class="md-nav__icon md-icon"></span>
- </label>
-
- <nav class="md-nav" data-md-level="1" aria-labelledby="__nav_5_label" aria-expanded="false">
- <label class="md-nav__title" for="__nav_5">
- <span class="md-nav__icon md-icon"></span>
- Configuration
- </label>
- <ul class="md-nav__list" data-md-scrollfix>
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../config/config/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Config files
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../config/commands/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Command definitions
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../config/demonstrations/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Demonstrations
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../config/env/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Environment variables
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../config/docker/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Docker images
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../config/summarizers/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Summarizers
- </span>
-
- </a>
- </li>
-
-
-
- </ul>
- </nav>
-
- </li>
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item md-nav__item--nested">
-
-
-
- <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_6" >
-
-
- <label class="md-nav__link" for="__nav_6" id="__nav_6_label" tabindex="0">
-
-
- <span class="md-ellipsis">
- Development
- </span>
-
- <span class="md-nav__icon md-icon"></span>
- </label>
-
- <nav class="md-nav" data-md-level="1" aria-labelledby="__nav_6_label" aria-expanded="false">
- <label class="md-nav__title" for="__nav_6">
- <span class="md-nav__icon md-icon"></span>
- Development
- </label>
- <ul class="md-nav__list" data-md-scrollfix>
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../dev/contribute/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Contribution guide
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../dev/formatting_conflicts/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Formatting conflicts
- </span>
-
- </a>
- </li>
-
-
-
- </ul>
- </nav>
-
- </li>
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item md-nav__item--active md-nav__item--nested">
-
-
-
- <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_7" checked>
-
-
-
- <div class="md-nav__link md-nav__container">
- <a href="../" class="md-nav__link ">
-
-
- <span class="md-ellipsis">
- Reference
- </span>
-
- </a>
-
-
- <label class="md-nav__link " for="__nav_7" id="__nav_7_label" tabindex="0">
- <span class="md-nav__icon md-icon"></span>
- </label>
-
- </div>
-
- <nav class="md-nav" data-md-level="1" aria-labelledby="__nav_7_label" aria-expanded="true">
- <label class="md-nav__title" for="__nav_7">
- <span class="md-nav__icon md-icon"></span>
- Reference
- </label>
- <ul class="md-nav__list" data-md-scrollfix>
-
-
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item md-nav__item--active">
-
- <input class="md-nav__toggle md-toggle" type="checkbox" id="__toc">
-
-
-
-
-
- <label class="md-nav__link md-nav__link--active" for="__toc">
-
-
- <span class="md-ellipsis">
- Agent
- </span>
-
- <span class="md-nav__icon md-icon"></span>
- </label>
-
- <a href="./" class="md-nav__link md-nav__link--active">
-
-
- <span class="md-ellipsis">
- Agent
- </span>
-
- </a>
-
-
- <nav class="md-nav md-nav--secondary" aria-label="Table of contents">
-
-
-
-
-
-
- <label class="md-nav__title" for="__toc">
- <span class="md-nav__icon md-icon"></span>
- Table of contents
- </label>
- <ul class="md-nav__list" data-md-component="toc" data-md-scrollfix>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents" class="md-nav__link">
- <span class="md-ellipsis">
- agents
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent" class="md-nav__link">
- <span class="md-ellipsis">
- Agent
- </span>
- </a>
-
- <nav class="md-nav" aria-label="Agent">
- <ul class="md-nav__list">
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.history" class="md-nav__link">
- <span class="md-ellipsis">
- history
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.info" class="md-nav__link">
- <span class="md-ellipsis">
- info
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.local_history" class="md-nav__link">
- <span class="md-ellipsis">
- local_history
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.state_command" class="md-nav__link">
- <span class="md-ellipsis">
- state_command
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.traj_path" class="md-nav__link">
- <span class="md-ellipsis">
- traj_path
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.trajectory" class="md-nav__link">
- <span class="md-ellipsis">
- trajectory
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.add_hook" class="md-nav__link">
- <span class="md-ellipsis">
- add_hook
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.call_subroutine" class="md-nav__link">
- <span class="md-ellipsis">
- call_subroutine
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.check_format_and_requery" class="md-nav__link">
- <span class="md-ellipsis">
- check_format_and_requery
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.forward" class="md-nav__link">
- <span class="md-ellipsis">
- forward
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.forward_model" class="md-nav__link">
- <span class="md-ellipsis">
- forward_model
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.forward_with_error_check" class="md-nav__link">
- <span class="md-ellipsis">
- forward_with_error_check
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.get_environment_vars" class="md-nav__link">
- <span class="md-ellipsis">
- get_environment_vars
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.retry_after_blocklist_fail" class="md-nav__link">
- <span class="md-ellipsis">
- retry_after_blocklist_fail
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.retry_after_format_fail" class="md-nav__link">
- <span class="md-ellipsis">
- retry_after_format_fail
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.run" class="md-nav__link">
- <span class="md-ellipsis">
- run
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.save_trajectory" class="md-nav__link">
- <span class="md-ellipsis">
- save_trajectory
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.set_environment_vars" class="md-nav__link">
- <span class="md-ellipsis">
- set_environment_vars
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.setup" class="md-nav__link">
- <span class="md-ellipsis">
- setup
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.setup_attempt" class="md-nav__link">
- <span class="md-ellipsis">
- setup_attempt
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.should_block_action" class="md-nav__link">
- <span class="md-ellipsis">
- should_block_action
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.split_actions" class="md-nav__link">
- <span class="md-ellipsis">
- split_actions
- </span>
- </a>
-
- </li>
-
- </ul>
- </nav>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.AgentArguments" class="md-nav__link">
- <span class="md-ellipsis">
- AgentArguments
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.AgentHook" class="md-nav__link">
- <span class="md-ellipsis">
- AgentHook
- </span>
- </a>
-
- <nav class="md-nav" aria-label="AgentHook">
- <ul class="md-nav__list">
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.AgentHook.on_init" class="md-nav__link">
- <span class="md-ellipsis">
- on_init
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.AgentHook.on_model_query" class="md-nav__link">
- <span class="md-ellipsis">
- on_model_query
- </span>
- </a>
-
- </li>
-
- </ul>
- </nav>
-
- </li>
-
- </ul>
-
- </nav>
-
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../models/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Models
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../env/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Environment
- </span>
-
- </a>
- </li>
-
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../env_utils/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- Environment utils
- </span>
-
- </a>
- </li>
-
-
-
- </ul>
- </nav>
-
- </li>
-
-
-
-
-
-
-
-
- <li class="md-nav__item">
- <a href="../../faq/" class="md-nav__link">
-
-
- <span class="md-ellipsis">
- FAQ
- </span>
-
- </a>
- </li>
-
-
- </ul>
- </nav>
- </div>
- </div>
- </div>
-
-
-
- <div class="md-sidebar md-sidebar--secondary" data-md-component="sidebar" data-md-type="toc" >
- <div class="md-sidebar__scrollwrap">
- <div class="md-sidebar__inner">
-
- <nav class="md-nav md-nav--secondary" aria-label="Table of contents">
-
-
-
-
-
-
- <label class="md-nav__title" for="__toc">
- <span class="md-nav__icon md-icon"></span>
- Table of contents
- </label>
- <ul class="md-nav__list" data-md-component="toc" data-md-scrollfix>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents" class="md-nav__link">
- <span class="md-ellipsis">
- agents
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent" class="md-nav__link">
- <span class="md-ellipsis">
- Agent
- </span>
- </a>
-
- <nav class="md-nav" aria-label="Agent">
- <ul class="md-nav__list">
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.history" class="md-nav__link">
- <span class="md-ellipsis">
- history
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.info" class="md-nav__link">
- <span class="md-ellipsis">
- info
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.local_history" class="md-nav__link">
- <span class="md-ellipsis">
- local_history
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.state_command" class="md-nav__link">
- <span class="md-ellipsis">
- state_command
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.traj_path" class="md-nav__link">
- <span class="md-ellipsis">
- traj_path
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.trajectory" class="md-nav__link">
- <span class="md-ellipsis">
- trajectory
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.add_hook" class="md-nav__link">
- <span class="md-ellipsis">
- add_hook
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.call_subroutine" class="md-nav__link">
- <span class="md-ellipsis">
- call_subroutine
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.check_format_and_requery" class="md-nav__link">
- <span class="md-ellipsis">
- check_format_and_requery
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.forward" class="md-nav__link">
- <span class="md-ellipsis">
- forward
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.forward_model" class="md-nav__link">
- <span class="md-ellipsis">
- forward_model
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.forward_with_error_check" class="md-nav__link">
- <span class="md-ellipsis">
- forward_with_error_check
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.get_environment_vars" class="md-nav__link">
- <span class="md-ellipsis">
- get_environment_vars
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.retry_after_blocklist_fail" class="md-nav__link">
- <span class="md-ellipsis">
- retry_after_blocklist_fail
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.retry_after_format_fail" class="md-nav__link">
- <span class="md-ellipsis">
- retry_after_format_fail
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.run" class="md-nav__link">
- <span class="md-ellipsis">
- run
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.save_trajectory" class="md-nav__link">
- <span class="md-ellipsis">
- save_trajectory
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.set_environment_vars" class="md-nav__link">
- <span class="md-ellipsis">
- set_environment_vars
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.setup" class="md-nav__link">
- <span class="md-ellipsis">
- setup
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.setup_attempt" class="md-nav__link">
- <span class="md-ellipsis">
- setup_attempt
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.should_block_action" class="md-nav__link">
- <span class="md-ellipsis">
- should_block_action
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.Agent.split_actions" class="md-nav__link">
- <span class="md-ellipsis">
- split_actions
- </span>
- </a>
-
- </li>
-
- </ul>
- </nav>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.AgentArguments" class="md-nav__link">
- <span class="md-ellipsis">
- AgentArguments
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.AgentHook" class="md-nav__link">
- <span class="md-ellipsis">
- AgentHook
- </span>
- </a>
-
- <nav class="md-nav" aria-label="AgentHook">
- <ul class="md-nav__list">
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.AgentHook.on_init" class="md-nav__link">
- <span class="md-ellipsis">
- on_init
- </span>
- </a>
-
- </li>
-
- <li class="md-nav__item">
- <a href="#sweagent.agent.agents.AgentHook.on_model_query" class="md-nav__link">
- <span class="md-ellipsis">
- on_model_query
- </span>
- </a>
-
- </li>
-
- </ul>
- </nav>
-
- </li>
-
- </ul>
-
- </nav>
- </div>
- </div>
- </div>
-
-
-
- <div class="md-content" data-md-component="content">
- <article class="md-content__inner md-typeset">
-
-
-
- <a href="https://github.com/princeton-nlp/SWE-agent/edit/main/docs/reference/agent.md" title="Edit this page" class="md-content__button md-icon">
-
- <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M10 20H6V4h7v5h5v3.1l2-2V8l-6-6H6c-1.1 0-2 .9-2 2v16c0 1.1.9 2 2 2h4zm10.2-7c.1 0 .3.1.4.2l1.3 1.3c.2.2.2.6 0 .8l-1 1-2.1-2.1 1-1c.1-.1.2-.2.4-.2m0 3.9L14.1 23H12v-2.1l6.1-6.1z"/></svg>
- </a>
-
-
- <h1 id="the-agent-class">The agent class</h1>
- <div class="doc doc-object doc-module">
- <a id="sweagent.agent.agents"></a>
- <div class="doc doc-contents first">
- <div class="doc doc-children">
- <div class="doc doc-object doc-class">
- <h2 id="sweagent.agent.agents.Agent" class="doc doc-heading">
- <code>Agent</code>
- </h2>
- <div class="doc doc-contents ">
- <p>Agent handles the behaviour of the model and how it interacts with the environment.</p>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal"> 263</span>
- <span class="normal"> 264</span>
- <span class="normal"> 265</span>
- <span class="normal"> 266</span>
- <span class="normal"> 267</span>
- <span class="normal"> 268</span>
- <span class="normal"> 269</span>
- <span class="normal"> 270</span>
- <span class="normal"> 271</span>
- <span class="normal"> 272</span>
- <span class="normal"> 273</span>
- <span class="normal"> 274</span>
- <span class="normal"> 275</span>
- <span class="normal"> 276</span>
- <span class="normal"> 277</span>
- <span class="normal"> 278</span>
- <span class="normal"> 279</span>
- <span class="normal"> 280</span>
- <span class="normal"> 281</span>
- <span class="normal"> 282</span>
- <span class="normal"> 283</span>
- <span class="normal"> 284</span>
- <span class="normal"> 285</span>
- <span class="normal"> 286</span>
- <span class="normal"> 287</span>
- <span class="normal"> 288</span>
- <span class="normal"> 289</span>
- <span class="normal"> 290</span>
- <span class="normal"> 291</span>
- <span class="normal"> 292</span>
- <span class="normal"> 293</span>
- <span class="normal"> 294</span>
- <span class="normal"> 295</span>
- <span class="normal"> 296</span>
- <span class="normal"> 297</span>
- <span class="normal"> 298</span>
- <span class="normal"> 299</span>
- <span class="normal"> 300</span>
- <span class="normal"> 301</span>
- <span class="normal"> 302</span>
- <span class="normal"> 303</span>
- <span class="normal"> 304</span>
- <span class="normal"> 305</span>
- <span class="normal"> 306</span>
- <span class="normal"> 307</span>
- <span class="normal"> 308</span>
- <span class="normal"> 309</span>
- <span class="normal"> 310</span>
- <span class="normal"> 311</span>
- <span class="normal"> 312</span>
- <span class="normal"> 313</span>
- <span class="normal"> 314</span>
- <span class="normal"> 315</span>
- <span class="normal"> 316</span>
- <span class="normal"> 317</span>
- <span class="normal"> 318</span>
- <span class="normal"> 319</span>
- <span class="normal"> 320</span>
- <span class="normal"> 321</span>
- <span class="normal"> 322</span>
- <span class="normal"> 323</span>
- <span class="normal"> 324</span>
- <span class="normal"> 325</span>
- <span class="normal"> 326</span>
- <span class="normal"> 327</span>
- <span class="normal"> 328</span>
- <span class="normal"> 329</span>
- <span class="normal"> 330</span>
- <span class="normal"> 331</span>
- <span class="normal"> 332</span>
- <span class="normal"> 333</span>
- <span class="normal"> 334</span>
- <span class="normal"> 335</span>
- <span class="normal"> 336</span>
- <span class="normal"> 337</span>
- <span class="normal"> 338</span>
- <span class="normal"> 339</span>
- <span class="normal"> 340</span>
- <span class="normal"> 341</span>
- <span class="normal"> 342</span>
- <span class="normal"> 343</span>
- <span class="normal"> 344</span>
- <span class="normal"> 345</span>
- <span class="normal"> 346</span>
- <span class="normal"> 347</span>
- <span class="normal"> 348</span>
- <span class="normal"> 349</span>
- <span class="normal"> 350</span>
- <span class="normal"> 351</span>
- <span class="normal"> 352</span>
- <span class="normal"> 353</span>
- <span class="normal"> 354</span>
- <span class="normal"> 355</span>
- <span class="normal"> 356</span>
- <span class="normal"> 357</span>
- <span class="normal"> 358</span>
- <span class="normal"> 359</span>
- <span class="normal"> 360</span>
- <span class="normal"> 361</span>
- <span class="normal"> 362</span>
- <span class="normal"> 363</span>
- <span class="normal"> 364</span>
- <span class="normal"> 365</span>
- <span class="normal"> 366</span>
- <span class="normal"> 367</span>
- <span class="normal"> 368</span>
- <span class="normal"> 369</span>
- <span class="normal"> 370</span>
- <span class="normal"> 371</span>
- <span class="normal"> 372</span>
- <span class="normal"> 373</span>
- <span class="normal"> 374</span>
- <span class="normal"> 375</span>
- <span class="normal"> 376</span>
- <span class="normal"> 377</span>
- <span class="normal"> 378</span>
- <span class="normal"> 379</span>
- <span class="normal"> 380</span>
- <span class="normal"> 381</span>
- <span class="normal"> 382</span>
- <span class="normal"> 383</span>
- <span class="normal"> 384</span>
- <span class="normal"> 385</span>
- <span class="normal"> 386</span>
- <span class="normal"> 387</span>
- <span class="normal"> 388</span>
- <span class="normal"> 389</span>
- <span class="normal"> 390</span>
- <span class="normal"> 391</span>
- <span class="normal"> 392</span>
- <span class="normal"> 393</span>
- <span class="normal"> 394</span>
- <span class="normal"> 395</span>
- <span class="normal"> 396</span>
- <span class="normal"> 397</span>
- <span class="normal"> 398</span>
- <span class="normal"> 399</span>
- <span class="normal"> 400</span>
- <span class="normal"> 401</span>
- <span class="normal"> 402</span>
- <span class="normal"> 403</span>
- <span class="normal"> 404</span>
- <span class="normal"> 405</span>
- <span class="normal"> 406</span>
- <span class="normal"> 407</span>
- <span class="normal"> 408</span>
- <span class="normal"> 409</span>
- <span class="normal"> 410</span>
- <span class="normal"> 411</span>
- <span class="normal"> 412</span>
- <span class="normal"> 413</span>
- <span class="normal"> 414</span>
- <span class="normal"> 415</span>
- <span class="normal"> 416</span>
- <span class="normal"> 417</span>
- <span class="normal"> 418</span>
- <span class="normal"> 419</span>
- <span class="normal"> 420</span>
- <span class="normal"> 421</span>
- <span class="normal"> 422</span>
- <span class="normal"> 423</span>
- <span class="normal"> 424</span>
- <span class="normal"> 425</span>
- <span class="normal"> 426</span>
- <span class="normal"> 427</span>
- <span class="normal"> 428</span>
- <span class="normal"> 429</span>
- <span class="normal"> 430</span>
- <span class="normal"> 431</span>
- <span class="normal"> 432</span>
- <span class="normal"> 433</span>
- <span class="normal"> 434</span>
- <span class="normal"> 435</span>
- <span class="normal"> 436</span>
- <span class="normal"> 437</span>
- <span class="normal"> 438</span>
- <span class="normal"> 439</span>
- <span class="normal"> 440</span>
- <span class="normal"> 441</span>
- <span class="normal"> 442</span>
- <span class="normal"> 443</span>
- <span class="normal"> 444</span>
- <span class="normal"> 445</span>
- <span class="normal"> 446</span>
- <span class="normal"> 447</span>
- <span class="normal"> 448</span>
- <span class="normal"> 449</span>
- <span class="normal"> 450</span>
- <span class="normal"> 451</span>
- <span class="normal"> 452</span>
- <span class="normal"> 453</span>
- <span class="normal"> 454</span>
- <span class="normal"> 455</span>
- <span class="normal"> 456</span>
- <span class="normal"> 457</span>
- <span class="normal"> 458</span>
- <span class="normal"> 459</span>
- <span class="normal"> 460</span>
- <span class="normal"> 461</span>
- <span class="normal"> 462</span>
- <span class="normal"> 463</span>
- <span class="normal"> 464</span>
- <span class="normal"> 465</span>
- <span class="normal"> 466</span>
- <span class="normal"> 467</span>
- <span class="normal"> 468</span>
- <span class="normal"> 469</span>
- <span class="normal"> 470</span>
- <span class="normal"> 471</span>
- <span class="normal"> 472</span>
- <span class="normal"> 473</span>
- <span class="normal"> 474</span>
- <span class="normal"> 475</span>
- <span class="normal"> 476</span>
- <span class="normal"> 477</span>
- <span class="normal"> 478</span>
- <span class="normal"> 479</span>
- <span class="normal"> 480</span>
- <span class="normal"> 481</span>
- <span class="normal"> 482</span>
- <span class="normal"> 483</span>
- <span class="normal"> 484</span>
- <span class="normal"> 485</span>
- <span class="normal"> 486</span>
- <span class="normal"> 487</span>
- <span class="normal"> 488</span>
- <span class="normal"> 489</span>
- <span class="normal"> 490</span>
- <span class="normal"> 491</span>
- <span class="normal"> 492</span>
- <span class="normal"> 493</span>
- <span class="normal"> 494</span>
- <span class="normal"> 495</span>
- <span class="normal"> 496</span>
- <span class="normal"> 497</span>
- <span class="normal"> 498</span>
- <span class="normal"> 499</span>
- <span class="normal"> 500</span>
- <span class="normal"> 501</span>
- <span class="normal"> 502</span>
- <span class="normal"> 503</span>
- <span class="normal"> 504</span>
- <span class="normal"> 505</span>
- <span class="normal"> 506</span>
- <span class="normal"> 507</span>
- <span class="normal"> 508</span>
- <span class="normal"> 509</span>
- <span class="normal"> 510</span>
- <span class="normal"> 511</span>
- <span class="normal"> 512</span>
- <span class="normal"> 513</span>
- <span class="normal"> 514</span>
- <span class="normal"> 515</span>
- <span class="normal"> 516</span>
- <span class="normal"> 517</span>
- <span class="normal"> 518</span>
- <span class="normal"> 519</span>
- <span class="normal"> 520</span>
- <span class="normal"> 521</span>
- <span class="normal"> 522</span>
- <span class="normal"> 523</span>
- <span class="normal"> 524</span>
- <span class="normal"> 525</span>
- <span class="normal"> 526</span>
- <span class="normal"> 527</span>
- <span class="normal"> 528</span>
- <span class="normal"> 529</span>
- <span class="normal"> 530</span>
- <span class="normal"> 531</span>
- <span class="normal"> 532</span>
- <span class="normal"> 533</span>
- <span class="normal"> 534</span>
- <span class="normal"> 535</span>
- <span class="normal"> 536</span>
- <span class="normal"> 537</span>
- <span class="normal"> 538</span>
- <span class="normal"> 539</span>
- <span class="normal"> 540</span>
- <span class="normal"> 541</span>
- <span class="normal"> 542</span>
- <span class="normal"> 543</span>
- <span class="normal"> 544</span>
- <span class="normal"> 545</span>
- <span class="normal"> 546</span>
- <span class="normal"> 547</span>
- <span class="normal"> 548</span>
- <span class="normal"> 549</span>
- <span class="normal"> 550</span>
- <span class="normal"> 551</span>
- <span class="normal"> 552</span>
- <span class="normal"> 553</span>
- <span class="normal"> 554</span>
- <span class="normal"> 555</span>
- <span class="normal"> 556</span>
- <span class="normal"> 557</span>
- <span class="normal"> 558</span>
- <span class="normal"> 559</span>
- <span class="normal"> 560</span>
- <span class="normal"> 561</span>
- <span class="normal"> 562</span>
- <span class="normal"> 563</span>
- <span class="normal"> 564</span>
- <span class="normal"> 565</span>
- <span class="normal"> 566</span>
- <span class="normal"> 567</span>
- <span class="normal"> 568</span>
- <span class="normal"> 569</span>
- <span class="normal"> 570</span>
- <span class="normal"> 571</span>
- <span class="normal"> 572</span>
- <span class="normal"> 573</span>
- <span class="normal"> 574</span>
- <span class="normal"> 575</span>
- <span class="normal"> 576</span>
- <span class="normal"> 577</span>
- <span class="normal"> 578</span>
- <span class="normal"> 579</span>
- <span class="normal"> 580</span>
- <span class="normal"> 581</span>
- <span class="normal"> 582</span>
- <span class="normal"> 583</span>
- <span class="normal"> 584</span>
- <span class="normal"> 585</span>
- <span class="normal"> 586</span>
- <span class="normal"> 587</span>
- <span class="normal"> 588</span>
- <span class="normal"> 589</span>
- <span class="normal"> 590</span>
- <span class="normal"> 591</span>
- <span class="normal"> 592</span>
- <span class="normal"> 593</span>
- <span class="normal"> 594</span>
- <span class="normal"> 595</span>
- <span class="normal"> 596</span>
- <span class="normal"> 597</span>
- <span class="normal"> 598</span>
- <span class="normal"> 599</span>
- <span class="normal"> 600</span>
- <span class="normal"> 601</span>
- <span class="normal"> 602</span>
- <span class="normal"> 603</span>
- <span class="normal"> 604</span>
- <span class="normal"> 605</span>
- <span class="normal"> 606</span>
- <span class="normal"> 607</span>
- <span class="normal"> 608</span>
- <span class="normal"> 609</span>
- <span class="normal"> 610</span>
- <span class="normal"> 611</span>
- <span class="normal"> 612</span>
- <span class="normal"> 613</span>
- <span class="normal"> 614</span>
- <span class="normal"> 615</span>
- <span class="normal"> 616</span>
- <span class="normal"> 617</span>
- <span class="normal"> 618</span>
- <span class="normal"> 619</span>
- <span class="normal"> 620</span>
- <span class="normal"> 621</span>
- <span class="normal"> 622</span>
- <span class="normal"> 623</span>
- <span class="normal"> 624</span>
- <span class="normal"> 625</span>
- <span class="normal"> 626</span>
- <span class="normal"> 627</span>
- <span class="normal"> 628</span>
- <span class="normal"> 629</span>
- <span class="normal"> 630</span>
- <span class="normal"> 631</span>
- <span class="normal"> 632</span>
- <span class="normal"> 633</span>
- <span class="normal"> 634</span>
- <span class="normal"> 635</span>
- <span class="normal"> 636</span>
- <span class="normal"> 637</span>
- <span class="normal"> 638</span>
- <span class="normal"> 639</span>
- <span class="normal"> 640</span>
- <span class="normal"> 641</span>
- <span class="normal"> 642</span>
- <span class="normal"> 643</span>
- <span class="normal"> 644</span>
- <span class="normal"> 645</span>
- <span class="normal"> 646</span>
- <span class="normal"> 647</span>
- <span class="normal"> 648</span>
- <span class="normal"> 649</span>
- <span class="normal"> 650</span>
- <span class="normal"> 651</span>
- <span class="normal"> 652</span>
- <span class="normal"> 653</span>
- <span class="normal"> 654</span>
- <span class="normal"> 655</span>
- <span class="normal"> 656</span>
- <span class="normal"> 657</span>
- <span class="normal"> 658</span>
- <span class="normal"> 659</span>
- <span class="normal"> 660</span>
- <span class="normal"> 661</span>
- <span class="normal"> 662</span>
- <span class="normal"> 663</span>
- <span class="normal"> 664</span>
- <span class="normal"> 665</span>
- <span class="normal"> 666</span>
- <span class="normal"> 667</span>
- <span class="normal"> 668</span>
- <span class="normal"> 669</span>
- <span class="normal"> 670</span>
- <span class="normal"> 671</span>
- <span class="normal"> 672</span>
- <span class="normal"> 673</span>
- <span class="normal"> 674</span>
- <span class="normal"> 675</span>
- <span class="normal"> 676</span>
- <span class="normal"> 677</span>
- <span class="normal"> 678</span>
- <span class="normal"> 679</span>
- <span class="normal"> 680</span>
- <span class="normal"> 681</span>
- <span class="normal"> 682</span>
- <span class="normal"> 683</span>
- <span class="normal"> 684</span>
- <span class="normal"> 685</span>
- <span class="normal"> 686</span>
- <span class="normal"> 687</span>
- <span class="normal"> 688</span>
- <span class="normal"> 689</span>
- <span class="normal"> 690</span>
- <span class="normal"> 691</span>
- <span class="normal"> 692</span>
- <span class="normal"> 693</span>
- <span class="normal"> 694</span>
- <span class="normal"> 695</span>
- <span class="normal"> 696</span>
- <span class="normal"> 697</span>
- <span class="normal"> 698</span>
- <span class="normal"> 699</span>
- <span class="normal"> 700</span>
- <span class="normal"> 701</span>
- <span class="normal"> 702</span>
- <span class="normal"> 703</span>
- <span class="normal"> 704</span>
- <span class="normal"> 705</span>
- <span class="normal"> 706</span>
- <span class="normal"> 707</span>
- <span class="normal"> 708</span>
- <span class="normal"> 709</span>
- <span class="normal"> 710</span>
- <span class="normal"> 711</span>
- <span class="normal"> 712</span>
- <span class="normal"> 713</span>
- <span class="normal"> 714</span>
- <span class="normal"> 715</span>
- <span class="normal"> 716</span>
- <span class="normal"> 717</span>
- <span class="normal"> 718</span>
- <span class="normal"> 719</span>
- <span class="normal"> 720</span>
- <span class="normal"> 721</span>
- <span class="normal"> 722</span>
- <span class="normal"> 723</span>
- <span class="normal"> 724</span>
- <span class="normal"> 725</span>
- <span class="normal"> 726</span>
- <span class="normal"> 727</span>
- <span class="normal"> 728</span>
- <span class="normal"> 729</span>
- <span class="normal"> 730</span>
- <span class="normal"> 731</span>
- <span class="normal"> 732</span>
- <span class="normal"> 733</span>
- <span class="normal"> 734</span>
- <span class="normal"> 735</span>
- <span class="normal"> 736</span>
- <span class="normal"> 737</span>
- <span class="normal"> 738</span>
- <span class="normal"> 739</span>
- <span class="normal"> 740</span>
- <span class="normal"> 741</span>
- <span class="normal"> 742</span>
- <span class="normal"> 743</span>
- <span class="normal"> 744</span>
- <span class="normal"> 745</span>
- <span class="normal"> 746</span>
- <span class="normal"> 747</span>
- <span class="normal"> 748</span>
- <span class="normal"> 749</span>
- <span class="normal"> 750</span>
- <span class="normal"> 751</span>
- <span class="normal"> 752</span>
- <span class="normal"> 753</span>
- <span class="normal"> 754</span>
- <span class="normal"> 755</span>
- <span class="normal"> 756</span>
- <span class="normal"> 757</span>
- <span class="normal"> 758</span>
- <span class="normal"> 759</span>
- <span class="normal"> 760</span>
- <span class="normal"> 761</span>
- <span class="normal"> 762</span>
- <span class="normal"> 763</span>
- <span class="normal"> 764</span>
- <span class="normal"> 765</span>
- <span class="normal"> 766</span>
- <span class="normal"> 767</span>
- <span class="normal"> 768</span>
- <span class="normal"> 769</span>
- <span class="normal"> 770</span>
- <span class="normal"> 771</span>
- <span class="normal"> 772</span>
- <span class="normal"> 773</span>
- <span class="normal"> 774</span>
- <span class="normal"> 775</span>
- <span class="normal"> 776</span>
- <span class="normal"> 777</span>
- <span class="normal"> 778</span>
- <span class="normal"> 779</span>
- <span class="normal"> 780</span>
- <span class="normal"> 781</span>
- <span class="normal"> 782</span>
- <span class="normal"> 783</span>
- <span class="normal"> 784</span>
- <span class="normal"> 785</span>
- <span class="normal"> 786</span>
- <span class="normal"> 787</span>
- <span class="normal"> 788</span>
- <span class="normal"> 789</span>
- <span class="normal"> 790</span>
- <span class="normal"> 791</span>
- <span class="normal"> 792</span>
- <span class="normal"> 793</span>
- <span class="normal"> 794</span>
- <span class="normal"> 795</span>
- <span class="normal"> 796</span>
- <span class="normal"> 797</span>
- <span class="normal"> 798</span>
- <span class="normal"> 799</span>
- <span class="normal"> 800</span>
- <span class="normal"> 801</span>
- <span class="normal"> 802</span>
- <span class="normal"> 803</span>
- <span class="normal"> 804</span>
- <span class="normal"> 805</span>
- <span class="normal"> 806</span>
- <span class="normal"> 807</span>
- <span class="normal"> 808</span>
- <span class="normal"> 809</span>
- <span class="normal"> 810</span>
- <span class="normal"> 811</span>
- <span class="normal"> 812</span>
- <span class="normal"> 813</span>
- <span class="normal"> 814</span>
- <span class="normal"> 815</span>
- <span class="normal"> 816</span>
- <span class="normal"> 817</span>
- <span class="normal"> 818</span>
- <span class="normal"> 819</span>
- <span class="normal"> 820</span>
- <span class="normal"> 821</span>
- <span class="normal"> 822</span>
- <span class="normal"> 823</span>
- <span class="normal"> 824</span>
- <span class="normal"> 825</span>
- <span class="normal"> 826</span>
- <span class="normal"> 827</span>
- <span class="normal"> 828</span>
- <span class="normal"> 829</span>
- <span class="normal"> 830</span>
- <span class="normal"> 831</span>
- <span class="normal"> 832</span>
- <span class="normal"> 833</span>
- <span class="normal"> 834</span>
- <span class="normal"> 835</span>
- <span class="normal"> 836</span>
- <span class="normal"> 837</span>
- <span class="normal"> 838</span>
- <span class="normal"> 839</span>
- <span class="normal"> 840</span>
- <span class="normal"> 841</span>
- <span class="normal"> 842</span>
- <span class="normal"> 843</span>
- <span class="normal"> 844</span>
- <span class="normal"> 845</span>
- <span class="normal"> 846</span>
- <span class="normal"> 847</span>
- <span class="normal"> 848</span>
- <span class="normal"> 849</span>
- <span class="normal"> 850</span>
- <span class="normal"> 851</span>
- <span class="normal"> 852</span>
- <span class="normal"> 853</span>
- <span class="normal"> 854</span>
- <span class="normal"> 855</span>
- <span class="normal"> 856</span>
- <span class="normal"> 857</span>
- <span class="normal"> 858</span>
- <span class="normal"> 859</span>
- <span class="normal"> 860</span>
- <span class="normal"> 861</span>
- <span class="normal"> 862</span>
- <span class="normal"> 863</span>
- <span class="normal"> 864</span>
- <span class="normal"> 865</span>
- <span class="normal"> 866</span>
- <span class="normal"> 867</span>
- <span class="normal"> 868</span>
- <span class="normal"> 869</span>
- <span class="normal"> 870</span>
- <span class="normal"> 871</span>
- <span class="normal"> 872</span>
- <span class="normal"> 873</span>
- <span class="normal"> 874</span>
- <span class="normal"> 875</span>
- <span class="normal"> 876</span>
- <span class="normal"> 877</span>
- <span class="normal"> 878</span>
- <span class="normal"> 879</span>
- <span class="normal"> 880</span>
- <span class="normal"> 881</span>
- <span class="normal"> 882</span>
- <span class="normal"> 883</span>
- <span class="normal"> 884</span>
- <span class="normal"> 885</span>
- <span class="normal"> 886</span>
- <span class="normal"> 887</span>
- <span class="normal"> 888</span>
- <span class="normal"> 889</span>
- <span class="normal"> 890</span>
- <span class="normal"> 891</span>
- <span class="normal"> 892</span>
- <span class="normal"> 893</span>
- <span class="normal"> 894</span>
- <span class="normal"> 895</span>
- <span class="normal"> 896</span>
- <span class="normal"> 897</span>
- <span class="normal"> 898</span>
- <span class="normal"> 899</span>
- <span class="normal"> 900</span>
- <span class="normal"> 901</span>
- <span class="normal"> 902</span>
- <span class="normal"> 903</span>
- <span class="normal"> 904</span>
- <span class="normal"> 905</span>
- <span class="normal"> 906</span>
- <span class="normal"> 907</span>
- <span class="normal"> 908</span>
- <span class="normal"> 909</span>
- <span class="normal"> 910</span>
- <span class="normal"> 911</span>
- <span class="normal"> 912</span>
- <span class="normal"> 913</span>
- <span class="normal"> 914</span>
- <span class="normal"> 915</span>
- <span class="normal"> 916</span>
- <span class="normal"> 917</span>
- <span class="normal"> 918</span>
- <span class="normal"> 919</span>
- <span class="normal"> 920</span>
- <span class="normal"> 921</span>
- <span class="normal"> 922</span>
- <span class="normal"> 923</span>
- <span class="normal"> 924</span>
- <span class="normal"> 925</span>
- <span class="normal"> 926</span>
- <span class="normal"> 927</span>
- <span class="normal"> 928</span>
- <span class="normal"> 929</span>
- <span class="normal"> 930</span>
- <span class="normal"> 931</span>
- <span class="normal"> 932</span>
- <span class="normal"> 933</span>
- <span class="normal"> 934</span>
- <span class="normal"> 935</span>
- <span class="normal"> 936</span>
- <span class="normal"> 937</span>
- <span class="normal"> 938</span>
- <span class="normal"> 939</span>
- <span class="normal"> 940</span>
- <span class="normal"> 941</span>
- <span class="normal"> 942</span>
- <span class="normal"> 943</span>
- <span class="normal"> 944</span>
- <span class="normal"> 945</span>
- <span class="normal"> 946</span>
- <span class="normal"> 947</span>
- <span class="normal"> 948</span>
- <span class="normal"> 949</span>
- <span class="normal"> 950</span>
- <span class="normal"> 951</span>
- <span class="normal"> 952</span>
- <span class="normal"> 953</span>
- <span class="normal"> 954</span>
- <span class="normal"> 955</span>
- <span class="normal"> 956</span>
- <span class="normal"> 957</span>
- <span class="normal"> 958</span>
- <span class="normal"> 959</span>
- <span class="normal"> 960</span>
- <span class="normal"> 961</span>
- <span class="normal"> 962</span>
- <span class="normal"> 963</span>
- <span class="normal"> 964</span>
- <span class="normal"> 965</span>
- <span class="normal"> 966</span>
- <span class="normal"> 967</span>
- <span class="normal"> 968</span>
- <span class="normal"> 969</span>
- <span class="normal"> 970</span>
- <span class="normal"> 971</span>
- <span class="normal"> 972</span>
- <span class="normal"> 973</span>
- <span class="normal"> 974</span>
- <span class="normal"> 975</span>
- <span class="normal"> 976</span>
- <span class="normal"> 977</span>
- <span class="normal"> 978</span>
- <span class="normal"> 979</span>
- <span class="normal"> 980</span>
- <span class="normal"> 981</span>
- <span class="normal"> 982</span>
- <span class="normal"> 983</span>
- <span class="normal"> 984</span>
- <span class="normal"> 985</span>
- <span class="normal"> 986</span>
- <span class="normal"> 987</span>
- <span class="normal"> 988</span>
- <span class="normal"> 989</span>
- <span class="normal"> 990</span>
- <span class="normal"> 991</span>
- <span class="normal"> 992</span>
- <span class="normal"> 993</span>
- <span class="normal"> 994</span>
- <span class="normal"> 995</span>
- <span class="normal"> 996</span>
- <span class="normal"> 997</span>
- <span class="normal"> 998</span>
- <span class="normal"> 999</span>
- <span class="normal">1000</span>
- <span class="normal">1001</span>
- <span class="normal">1002</span>
- <span class="normal">1003</span>
- <span class="normal">1004</span>
- <span class="normal">1005</span>
- <span class="normal">1006</span>
- <span class="normal">1007</span>
- <span class="normal">1008</span>
- <span class="normal">1009</span>
- <span class="normal">1010</span>
- <span class="normal">1011</span>
- <span class="normal">1012</span>
- <span class="normal">1013</span>
- <span class="normal">1014</span>
- <span class="normal">1015</span>
- <span class="normal">1016</span>
- <span class="normal">1017</span>
- <span class="normal">1018</span>
- <span class="normal">1019</span>
- <span class="normal">1020</span>
- <span class="normal">1021</span>
- <span class="normal">1022</span>
- <span class="normal">1023</span>
- <span class="normal">1024</span>
- <span class="normal">1025</span>
- <span class="normal">1026</span>
- <span class="normal">1027</span>
- <span class="normal">1028</span>
- <span class="normal">1029</span>
- <span class="normal">1030</span>
- <span class="normal">1031</span>
- <span class="normal">1032</span>
- <span class="normal">1033</span>
- <span class="normal">1034</span>
- <span class="normal">1035</span>
- <span class="normal">1036</span>
- <span class="normal">1037</span>
- <span class="normal">1038</span>
- <span class="normal">1039</span>
- <span class="normal">1040</span>
- <span class="normal">1041</span>
- <span class="normal">1042</span>
- <span class="normal">1043</span>
- <span class="normal">1044</span>
- <span class="normal">1045</span>
- <span class="normal">1046</span>
- <span class="normal">1047</span>
- <span class="normal">1048</span>
- <span class="normal">1049</span>
- <span class="normal">1050</span>
- <span class="normal">1051</span>
- <span class="normal">1052</span>
- <span class="normal">1053</span>
- <span class="normal">1054</span>
- <span class="normal">1055</span>
- <span class="normal">1056</span>
- <span class="normal">1057</span>
- <span class="normal">1058</span>
- <span class="normal">1059</span>
- <span class="normal">1060</span>
- <span class="normal">1061</span>
- <span class="normal">1062</span>
- <span class="normal">1063</span>
- <span class="normal">1064</span>
- <span class="normal">1065</span>
- <span class="normal">1066</span>
- <span class="normal">1067</span>
- <span class="normal">1068</span>
- <span class="normal">1069</span>
- <span class="normal">1070</span>
- <span class="normal">1071</span>
- <span class="normal">1072</span>
- <span class="normal">1073</span>
- <span class="normal">1074</span>
- <span class="normal">1075</span>
- <span class="normal">1076</span>
- <span class="normal">1077</span>
- <span class="normal">1078</span>
- <span class="normal">1079</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">class</span> <span class="nc">Agent</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Agent handles the behaviour of the model and how it interacts with the environment."""</span>
- <span class="k">def</span> <span class="fm">__init__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">name</span><span class="p">:</span> <span class="nb">str</span><span class="p">,</span> <span class="n">args</span><span class="p">:</span> <span class="n">AgentArguments</span><span class="p">):</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">name</span> <span class="o">=</span> <span class="n">name</span>
- <span class="c1"># todo: currently only used to get the model name, so might remove this later</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_args</span> <span class="o">=</span> <span class="n">args</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">model</span> <span class="o">=</span> <span class="n">get_model</span><span class="p">(</span><span class="n">args</span><span class="o">.</span><span class="n">model</span><span class="p">,</span> <span class="n">args</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">_commands</span> <span class="o">+</span> <span class="n">args</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">subroutine_types</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">summarizer_model</span> <span class="o">=</span> <span class="n">get_model</span><span class="p">(</span>
- <span class="n">args</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">summarizer_config</span><span class="o">.</span><span class="n">model</span> <span class="k">if</span> <span class="n">args</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">summarizer_config</span><span class="o">.</span><span class="n">model</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="k">else</span> <span class="n">args</span><span class="o">.</span><span class="n">model</span>
- <span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="o">=</span> <span class="n">args</span><span class="o">.</span><span class="n">config</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="c1"># mypy</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">system_args</span> <span class="o">=</span> <span class="p">{</span>
- <span class="s2">"command_docs"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">command_docs</span><span class="p">,</span>
- <span class="o">**</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">env_variables</span><span class="p">,</span>
- <span class="p">}</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">instance_args</span> <span class="o">=</span> <span class="kc">None</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_parse_command_patterns</span><span class="p">()</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">last_container_id</span> <span class="o">=</span> <span class="kc">None</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">hooks</span> <span class="o">=</span> <span class="p">[]</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span> <span class="o">=</span> <span class="n">get_logger</span><span class="p">(</span><span class="s2">"agent"</span><span class="p">)</span>
- <span class="c1"># Requires instance, so is set in `setup` methods</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_rloop</span> <span class="o">=</span> <span class="kc">None</span>
- <span class="c1"># Set in run method</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_env</span><span class="p">:</span> <span class="n">SWEEnv</span> <span class="o">|</span> <span class="kc">None</span> <span class="o">=</span> <span class="kc">None</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">traj_dir</span><span class="p">:</span> <span class="kc">None</span> <span class="o">|</span> <span class="n">Path</span> <span class="o">=</span> <span class="kc">None</span>
- <span class="c1">#: Number of attempts to solve the issue when using a review loop</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_i_attempt</span><span class="p">:</span> <span class="nb">int</span> <span class="o">=</span> <span class="mi">0</span>
- <span class="c1">#: The following three attributes collect the information about how the agent</span>
- <span class="c1">#: solved the problem.</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_history_by_attempt</span><span class="p">:</span> <span class="nb">dict</span><span class="p">[</span><span class="nb">int</span><span class="p">,</span> <span class="nb">list</span><span class="p">]</span> <span class="o">=</span> <span class="n">defaultdict</span><span class="p">(</span><span class="nb">list</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_trajectory_by_attempt</span><span class="p">:</span> <span class="nb">dict</span><span class="p">[</span><span class="nb">int</span><span class="p">,</span> <span class="n">Trajectory</span><span class="p">]</span> <span class="o">=</span> <span class="n">defaultdict</span><span class="p">(</span><span class="nb">list</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_info_by_attempt</span><span class="p">:</span> <span class="nb">dict</span><span class="p">[</span><span class="nb">int</span><span class="p">,</span> <span class="n">AgentInfo</span><span class="p">]</span> <span class="o">=</span> <span class="n">defaultdict</span><span class="p">(</span><span class="nb">dict</span><span class="p">)</span>
- <span class="c1">#: Variables to be referenced in the templates that are forwarded from one</span>
- <span class="c1">#: solution attempt to the next</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_forwarded_vars</span><span class="p">:</span> <span class="nb">dict</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="n">Any</span><span class="p">]</span> <span class="o">=</span> <span class="p">{}</span>
- <span class="nd">@property</span>
- <span class="k">def</span> <span class="nf">history</span><span class="p">(</span><span class="bp">self</span><span class="p">)</span> <span class="o">-></span> <span class="n">History</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""History that is passed on to the model.</span>
- <span class="sd"> Use `_append_history` to modify.</span>
- <span class="sd"> """</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">_history_by_attempt</span><span class="p">[</span><span class="bp">self</span><span class="o">.</span><span class="n">_i_attempt</span><span class="p">]</span>
- <span class="nd">@history</span><span class="o">.</span><span class="n">setter</span>
- <span class="k">def</span> <span class="nf">history</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">value</span><span class="p">:</span> <span class="n">History</span><span class="p">):</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_history_by_attempt</span><span class="p">[</span><span class="bp">self</span><span class="o">.</span><span class="n">_i_attempt</span><span class="p">]</span> <span class="o">=</span> <span class="n">value</span>
- <span class="nd">@property</span>
- <span class="k">def</span> <span class="nf">trajectory</span><span class="p">(</span><span class="bp">self</span><span class="p">)</span> <span class="o">-></span> <span class="n">Trajectory</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Trajectory of the agent for the current instance. In contrast to `history`,</span>
- <span class="sd"> this is mostly for the informational value of how the agent interacted with</span>
- <span class="sd"> the environment and is also what is being used when replaying the trajectory</span>
- <span class="sd"> """</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">_trajectory_by_attempt</span><span class="p">[</span><span class="bp">self</span><span class="o">.</span><span class="n">_i_attempt</span><span class="p">]</span>
- <span class="nd">@trajectory</span><span class="o">.</span><span class="n">setter</span>
- <span class="k">def</span> <span class="nf">trajectory</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">value</span><span class="p">:</span> <span class="n">Trajectory</span><span class="p">):</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_trajectory_by_attempt</span><span class="p">[</span><span class="bp">self</span><span class="o">.</span><span class="n">_i_attempt</span><span class="p">]</span> <span class="o">=</span> <span class="n">value</span>
- <span class="nd">@property</span>
- <span class="k">def</span> <span class="nf">info</span><span class="p">(</span><span class="bp">self</span><span class="p">)</span> <span class="o">-></span> <span class="n">AgentInfo</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Information about the agent's run"""</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">_info_by_attempt</span><span class="p">[</span><span class="bp">self</span><span class="o">.</span><span class="n">_i_attempt</span><span class="p">]</span>
- <span class="nd">@info</span><span class="o">.</span><span class="n">setter</span>
- <span class="k">def</span> <span class="nf">info</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">value</span><span class="p">:</span> <span class="n">AgentInfo</span><span class="p">):</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_info_by_attempt</span><span class="p">[</span><span class="bp">self</span><span class="o">.</span><span class="n">_i_attempt</span><span class="p">]</span> <span class="o">=</span> <span class="n">value</span>
- <span class="nd">@property</span>
- <span class="k">def</span> <span class="nf">traj_path</span><span class="p">(</span><span class="bp">self</span><span class="p">)</span> <span class="o">-></span> <span class="n">Path</span> <span class="o">|</span> <span class="kc">None</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Returns path to the trajectory.</span>
- <span class="sd"> The path is reset for every new instance.</span>
- <span class="sd"> """</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">traj_dir</span> <span class="ow">and</span> <span class="bp">self</span><span class="o">.</span><span class="n">_env</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span><span class="p">:</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">_env</span><span class="o">.</span><span class="n">record</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">traj_dir</span> <span class="o">/</span> <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">_env</span><span class="o">.</span><span class="n">record</span><span class="p">[</span><span class="s2">"instance_id"</span><span class="p">]</span> <span class="o">+</span> <span class="s2">".traj"</span><span class="p">)</span>
- <span class="k">return</span> <span class="kc">None</span>
- <span class="k">def</span> <span class="nf">add_hook</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">hook</span><span class="p">:</span> <span class="n">AgentHook</span><span class="p">)</span> <span class="o">-></span> <span class="kc">None</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Add hook to agent"""</span>
- <span class="n">hook</span><span class="o">.</span><span class="n">on_init</span><span class="p">(</span><span class="n">agent</span><span class="o">=</span><span class="bp">self</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">hooks</span><span class="o">.</span><span class="n">append</span><span class="p">(</span><span class="n">hook</span><span class="p">)</span>
- <span class="k">def</span> <span class="nf">_append_history</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">item</span><span class="p">:</span> <span class="n">HistoryItem</span><span class="p">)</span> <span class="o">-></span> <span class="kc">None</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Adds an item to the history."""</span>
- <span class="k">for</span> <span class="n">hook</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">hooks</span><span class="p">:</span>
- <span class="n">hook</span><span class="o">.</span><span class="n">on_query_message_added</span><span class="p">(</span><span class="o">**</span><span class="n">item</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">history</span><span class="o">.</span><span class="n">append</span><span class="p">(</span><span class="n">item</span><span class="p">)</span>
- <span class="c1"># todo: klieret: Long term: Might make more sense to reinitialize the agent class for every instance instead of this</span>
- <span class="k">def</span> <span class="nf">setup</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">instance_args</span><span class="p">:</span> <span class="nb">dict</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="n">Any</span><span class="p">],</span> <span class="n">init_model_stats</span><span class="p">:</span> <span class="n">APIStats</span> <span class="o">|</span> <span class="kc">None</span> <span class="o">=</span> <span class="kc">None</span><span class="p">)</span> <span class="o">-></span> <span class="kc">None</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Setup the agent for a new instance. This includes</span>
- <span class="sd"> formatting the system message and adding demonstrations to the history.</span>
- <span class="sd"> Args:</span>
- <span class="sd"> instance_args: Arguments for the instance</span>
- <span class="sd"> """</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="c1"># mypy</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">instance_args</span> <span class="o">=</span> <span class="n">instance_args</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_i_attempt</span> <span class="o">=</span> <span class="mi">0</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_history_by_attempt</span> <span class="o">=</span> <span class="n">defaultdict</span><span class="p">(</span><span class="nb">list</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_trajectory_by_attempt</span> <span class="o">=</span> <span class="n">defaultdict</span><span class="p">(</span><span class="nb">list</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_info_by_attempt</span> <span class="o">=</span> <span class="n">defaultdict</span><span class="p">(</span><span class="nb">dict</span><span class="p">)</span> <span class="c1"># type: ignore</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_forwarded_vars</span> <span class="o">=</span> <span class="p">{}</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">_rloop</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span><span class="p">:</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_forwarded_vars</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">_rloop</span><span class="o">.</span><span class="n">get_forwarded_vars</span><span class="p">()</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">setup_attempt</span><span class="p">(</span><span class="n">init_model_stats</span><span class="o">=</span><span class="n">init_model_stats</span><span class="p">)</span>
- <span class="k">for</span> <span class="n">hook</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">hooks</span><span class="p">:</span>
- <span class="n">hook</span><span class="o">.</span><span class="n">on_setup_done</span><span class="p">()</span>
- <span class="k">def</span> <span class="nf">setup_attempt</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="o">*</span><span class="p">,</span> <span class="n">init_model_stats</span><span class="p">:</span> <span class="n">APIStats</span> <span class="o">|</span> <span class="kc">None</span> <span class="o">=</span> <span class="kc">None</span><span class="p">)</span> <span class="o">-></span> <span class="kc">None</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Setup the agent for a new attempt. This includes resetting the model stats."""</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="c1"># mypy</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">_i_attempt</span> <span class="o">></span> <span class="mi">0</span> <span class="ow">and</span> <span class="n">init_model_stats</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span><span class="p">:</span>
- <span class="n">msg</span> <span class="o">=</span> <span class="p">(</span>
- <span class="s2">"We might be dealing with nested retries, where subroutines are mixed with retries. "</span>
- <span class="s2">"Currently, this messes up accounting with init_model_stats."</span>
- <span class="p">)</span>
- <span class="k">raise</span> <span class="ne">ValueError</span><span class="p">(</span><span class="n">msg</span><span class="p">)</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">_i_attempt</span> <span class="o">></span> <span class="mi">0</span><span class="p">:</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">_env</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="c1"># mypy</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_env</span><span class="o">.</span><span class="n">reset_for_new_attempt</span><span class="p">()</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">reset_stats</span><span class="p">(</span><span class="n">init_model_stats</span><span class="p">)</span>
- <span class="c1"># self.model = get_model(self._args.model, self.config._commands + self.config.subroutine_types)</span>
- <span class="c1"># fixme: This doesn't reset total cost</span>
- <span class="n">system_msg</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">system_template</span><span class="o">.</span><span class="n">format</span><span class="p">(</span><span class="o">**</span><span class="bp">self</span><span class="o">.</span><span class="n">system_args</span><span class="p">,</span> <span class="o">**</span><span class="bp">self</span><span class="o">.</span><span class="n">instance_args</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">info</span><span class="p">(</span><span class="sa">f</span><span class="s2">"SYSTEM (</span><span class="si">{</span><span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="si">}</span><span class="s2">)</span><span class="se">\n</span><span class="si">{</span><span class="n">system_msg</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_append_history</span><span class="p">(</span><span class="n">HistoryItem</span><span class="p">({</span><span class="s2">"role"</span><span class="p">:</span> <span class="s2">"system"</span><span class="p">,</span> <span class="s2">"content"</span><span class="p">:</span> <span class="n">system_msg</span><span class="p">,</span> <span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">}))</span>
- <span class="k">if</span> <span class="s2">"history_to_messages"</span> <span class="ow">in</span> <span class="nb">dir</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="p">):</span>
- <span class="k">for</span> <span class="n">demonstration_path</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">demonstrations</span><span class="p">:</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">demonstration_template</span> <span class="ow">is</span> <span class="kc">None</span> <span class="ow">and</span> <span class="ow">not</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">put_demos_in_history</span><span class="p">:</span>
- <span class="n">msg</span> <span class="o">=</span> <span class="s2">"Cannot use demonstrations without a demonstration template or put_demos_in_history=True"</span>
- <span class="k">raise</span> <span class="ne">ValueError</span><span class="p">(</span><span class="n">msg</span><span class="p">)</span>
- <span class="c1"># Load history</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">info</span><span class="p">(</span><span class="sa">f</span><span class="s2">"DEMONSTRATION: </span><span class="si">{</span><span class="n">demonstration_path</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="n">demo_history</span> <span class="o">=</span> <span class="n">json</span><span class="o">.</span><span class="n">loads</span><span class="p">(</span><span class="n">Path</span><span class="p">(</span><span class="n">demonstration_path</span><span class="p">)</span><span class="o">.</span><span class="n">read_text</span><span class="p">())[</span><span class="s2">"history"</span><span class="p">]</span>
- <span class="n">demo_history</span> <span class="o">=</span> <span class="p">[</span>
- <span class="n">entry</span>
- <span class="k">for</span> <span class="n">entry</span> <span class="ow">in</span> <span class="n">demo_history</span>
- <span class="k">if</span> <span class="p">(</span><span class="s2">"agent"</span> <span class="ow">not</span> <span class="ow">in</span> <span class="n">entry</span><span class="p">)</span> <span class="ow">or</span> <span class="p">(</span><span class="s2">"agent"</span> <span class="ow">in</span> <span class="n">entry</span> <span class="ow">and</span> <span class="n">entry</span><span class="p">[</span><span class="s2">"agent"</span><span class="p">]</span> <span class="o">==</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">)</span>
- <span class="p">]</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">put_demos_in_history</span><span class="p">:</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">demonstration_template</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span><span class="p">:</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="s2">"Demonstration template is ignored for put_demos_in_history=True"</span><span class="p">)</span>
- <span class="c1"># Add demonstration to history directly as separate messages</span>
- <span class="k">for</span> <span class="n">entry</span> <span class="ow">in</span> <span class="n">demo_history</span><span class="p">:</span>
- <span class="k">if</span> <span class="n">entry</span><span class="p">[</span><span class="s2">"role"</span><span class="p">]</span> <span class="o">!=</span> <span class="s2">"system"</span><span class="p">:</span>
- <span class="n">entry</span><span class="p">[</span><span class="s2">"is_demo"</span><span class="p">]</span> <span class="o">=</span> <span class="kc">True</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_append_history</span><span class="p">(</span><span class="n">entry</span><span class="p">)</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="c1"># Add demonstration as single message to history</span>
- <span class="n">demo_message</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">history_to_messages</span><span class="p">(</span>
- <span class="n">demo_history</span><span class="p">,</span>
- <span class="n">is_demonstration</span><span class="o">=</span><span class="kc">True</span><span class="p">,</span>
- <span class="p">)</span>
- <span class="n">demonstration</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">demonstration_template</span><span class="o">.</span><span class="n">format</span><span class="p">(</span><span class="n">demonstration</span><span class="o">=</span><span class="n">demo_message</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_append_history</span><span class="p">(</span>
- <span class="p">{</span>
- <span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">,</span>
- <span class="s2">"content"</span><span class="p">:</span> <span class="n">demonstration</span><span class="p">,</span>
- <span class="s2">"is_demo"</span><span class="p">:</span> <span class="kc">True</span><span class="p">,</span>
- <span class="s2">"role"</span><span class="p">:</span> <span class="s2">"user"</span><span class="p">,</span>
- <span class="p">},</span>
- <span class="p">)</span>
- <span class="nd">@property</span>
- <span class="k">def</span> <span class="nf">state_command</span><span class="p">(</span><span class="bp">self</span><span class="p">)</span> <span class="o">-></span> <span class="nb">str</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Return the bash command that will be used to extract the environment state."""</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">state_command</span><span class="o">.</span><span class="n">name</span>
- <span class="nd">@property</span>
- <span class="k">def</span> <span class="nf">local_history</span><span class="p">(</span><span class="bp">self</span><span class="p">)</span> <span class="o">-></span> <span class="nb">list</span><span class="p">[</span><span class="nb">dict</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="nb">str</span><span class="p">]]:</span>
- <span class="w"> </span><span class="sd">"""Return the history of the agent since the last reset."""</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">history_processor</span><span class="p">([</span><span class="n">entry</span> <span class="k">for</span> <span class="n">entry</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">history</span> <span class="k">if</span> <span class="n">entry</span><span class="p">[</span><span class="s2">"agent"</span><span class="p">]</span> <span class="o">==</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">])</span>
- <span class="k">def</span> <span class="nf">_get_total_stats</span><span class="p">(</span><span class="bp">self</span><span class="p">)</span> <span class="o">-></span> <span class="n">APIStats</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Combine model stats of different attempts"""</span>
- <span class="n">total_stats</span> <span class="o">=</span> <span class="n">APIStats</span><span class="p">()</span>
- <span class="k">for</span> <span class="n">stats</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">_info_by_attempt</span><span class="o">.</span><span class="n">values</span><span class="p">():</span>
- <span class="k">assert</span> <span class="s2">"model_stats"</span> <span class="ow">in</span> <span class="n">stats</span> <span class="c1"># mypy</span>
- <span class="n">attempt_stats</span> <span class="o">=</span> <span class="n">APIStats</span><span class="p">(</span><span class="o">**</span><span class="n">stats</span><span class="p">[</span><span class="s2">"model_stats"</span><span class="p">])</span> <span class="c1"># type: ignore</span>
- <span class="n">total_stats</span> <span class="o">+=</span> <span class="n">attempt_stats</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">_rloop</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span><span class="p">:</span>
- <span class="n">total_stats</span> <span class="o">+=</span> <span class="bp">self</span><span class="o">.</span><span class="n">_rloop</span><span class="o">.</span><span class="n">model_stats</span>
- <span class="k">return</span> <span class="n">total_stats</span>
- <span class="k">def</span> <span class="nf">save_trajectory</span><span class="p">(</span>
- <span class="bp">self</span><span class="p">,</span>
- <span class="p">)</span> <span class="o">-></span> <span class="kc">None</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Save the trajectory to disk.</span>
- <span class="sd"> This includes the history, the environment state, and the model stats.</span>
- <span class="sd"> """</span>
- <span class="k">def</span> <span class="nf">get_attempt_data</span><span class="p">(</span><span class="n">attempt_idx</span><span class="p">:</span> <span class="nb">int</span><span class="p">)</span> <span class="o">-></span> <span class="nb">dict</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="n">Any</span><span class="p">]:</span>
- <span class="w"> </span><span class="sd">"""Get data saved for every attempt"""</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">_env</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span>
- <span class="c1"># The deepcopy here is important because else the</span>
- <span class="c1"># data["info"]["model_stats"] update will create havoc!</span>
- <span class="k">return</span> <span class="n">copy</span><span class="o">.</span><span class="n">deepcopy</span><span class="p">(</span>
- <span class="p">{</span>
- <span class="s2">"environment"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">_env</span><span class="o">.</span><span class="n">name</span><span class="p">,</span>
- <span class="s2">"trajectory"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">_trajectory_by_attempt</span><span class="p">[</span><span class="n">attempt_idx</span><span class="p">],</span>
- <span class="s2">"history"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">_history_by_attempt</span><span class="p">[</span><span class="n">attempt_idx</span><span class="p">],</span>
- <span class="s2">"info"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">_info_by_attempt</span><span class="p">[</span><span class="n">attempt_idx</span><span class="p">],</span>
- <span class="p">}</span>
- <span class="p">)</span>
- <span class="n">data</span> <span class="o">=</span> <span class="p">{</span>
- <span class="o">**</span><span class="n">get_attempt_data</span><span class="p">(</span><span class="mi">0</span><span class="p">),</span>
- <span class="p">}</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">traj_path</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">traj_path</span><span class="o">.</span><span class="n">write_text</span><span class="p">(</span><span class="n">json</span><span class="o">.</span><span class="n">dumps</span><span class="p">(</span><span class="n">data</span><span class="p">,</span> <span class="n">indent</span><span class="o">=</span><span class="mi">2</span><span class="p">))</span>
- <span class="k">def</span> <span class="nf">_get_first_match</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">action</span><span class="p">:</span> <span class="nb">str</span><span class="p">,</span> <span class="n">pattern_type</span><span class="p">:</span> <span class="nb">str</span><span class="p">)</span> <span class="o">-></span> <span class="n">re</span><span class="o">.</span><span class="n">Match</span> <span class="o">|</span> <span class="kc">None</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Return the first match of a command pattern in the action string."""</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="c1"># mypy</span>
- <span class="k">if</span> <span class="n">pattern_type</span> <span class="o">==</span> <span class="s2">"subroutine"</span><span class="p">:</span>
- <span class="n">patterns</span> <span class="o">=</span> <span class="p">{</span><span class="n">k</span><span class="p">:</span> <span class="n">v</span> <span class="k">for</span> <span class="n">k</span><span class="p">,</span> <span class="n">v</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">subroutine_patterns</span><span class="o">.</span><span class="n">items</span><span class="p">()}</span>
- <span class="k">elif</span> <span class="n">pattern_type</span> <span class="o">==</span> <span class="s2">"multi_line"</span><span class="p">:</span>
- <span class="n">patterns</span> <span class="o">=</span> <span class="p">{</span>
- <span class="n">k</span><span class="p">:</span> <span class="n">v</span>
- <span class="k">for</span> <span class="n">k</span><span class="p">,</span> <span class="n">v</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">command_patterns</span><span class="o">.</span><span class="n">items</span><span class="p">()</span>
- <span class="k">if</span> <span class="n">k</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">multi_line_command_endings</span> <span class="ow">or</span> <span class="n">k</span> <span class="o">==</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">submit_command</span>
- <span class="p">}</span>
- <span class="n">patterns</span> <span class="o">+=</span> <span class="p">{</span>
- <span class="n">k</span><span class="p">:</span> <span class="n">v</span> <span class="k">for</span> <span class="n">k</span><span class="p">,</span> <span class="n">v</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">subroutine_patterns</span><span class="o">.</span><span class="n">items</span><span class="p">()</span> <span class="k">if</span> <span class="n">k</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">multi_line_command_endings</span>
- <span class="p">}</span>
- <span class="k">elif</span> <span class="n">pattern_type</span> <span class="o">==</span> <span class="s2">"multi_line_no_subroutines"</span><span class="p">:</span>
- <span class="n">patterns</span> <span class="o">=</span> <span class="p">{</span><span class="n">k</span><span class="p">:</span> <span class="n">v</span> <span class="k">for</span> <span class="n">k</span><span class="p">,</span> <span class="n">v</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">command_patterns</span><span class="o">.</span><span class="n">items</span><span class="p">()</span> <span class="k">if</span> <span class="n">k</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">multi_line_command_endings</span><span class="p">}</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="n">msg</span> <span class="o">=</span> <span class="sa">f</span><span class="s2">"Unknown pattern type: </span><span class="si">{</span><span class="n">pattern_type</span><span class="si">}</span><span class="s2">"</span>
- <span class="k">raise</span> <span class="ne">ValueError</span><span class="p">(</span><span class="n">msg</span><span class="p">)</span>
- <span class="n">matches</span> <span class="o">=</span> <span class="nb">list</span><span class="p">()</span>
- <span class="k">for</span> <span class="n">_</span><span class="p">,</span> <span class="n">pat</span> <span class="ow">in</span> <span class="n">patterns</span><span class="o">.</span><span class="n">items</span><span class="p">():</span>
- <span class="n">match</span> <span class="o">=</span> <span class="n">pat</span><span class="o">.</span><span class="n">search</span><span class="p">(</span><span class="n">action</span><span class="p">)</span>
- <span class="k">if</span> <span class="n">match</span><span class="p">:</span>
- <span class="n">matches</span><span class="o">.</span><span class="n">append</span><span class="p">(</span><span class="n">match</span><span class="p">)</span>
- <span class="k">if</span> <span class="nb">len</span><span class="p">(</span><span class="n">matches</span><span class="p">)</span> <span class="o">==</span> <span class="mi">0</span><span class="p">:</span>
- <span class="k">return</span> <span class="kc">None</span>
- <span class="n">matches</span> <span class="o">=</span> <span class="nb">sorted</span><span class="p">(</span><span class="n">matches</span><span class="p">,</span> <span class="n">key</span><span class="o">=</span><span class="k">lambda</span> <span class="n">x</span><span class="p">:</span> <span class="n">x</span><span class="o">.</span><span class="n">start</span><span class="p">())</span>
- <span class="k">return</span> <span class="n">matches</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span>
- <span class="k">def</span> <span class="nf">_guard_multiline_input</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">action</span><span class="p">:</span> <span class="nb">str</span><span class="p">)</span> <span class="o">-></span> <span class="nb">str</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Split action by multiline commands, then append the first line in each multiline command with "<< '{end_name}'".</span>
- <span class="sd"> Multiline commands (which are specified by an end_name) are commands that span multiple lines and are terminated by a specific end_name.</span>
- <span class="sd"> Their multi-line argument is sent using a heredoc, which is a way to send a multi-line string to a command in bash.</span>
- <span class="sd"> """</span>
- <span class="n">parsed_action</span> <span class="o">=</span> <span class="nb">list</span><span class="p">()</span>
- <span class="n">rem_action</span> <span class="o">=</span> <span class="n">action</span>
- <span class="k">while</span> <span class="n">rem_action</span><span class="o">.</span><span class="n">strip</span><span class="p">():</span>
- <span class="n">first_match</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">_get_first_match</span><span class="p">(</span><span class="n">rem_action</span><span class="p">,</span> <span class="s2">"multi_line_no_subroutines"</span><span class="p">)</span>
- <span class="k">if</span> <span class="n">first_match</span><span class="p">:</span>
- <span class="n">pre_action</span> <span class="o">=</span> <span class="n">rem_action</span><span class="p">[:</span> <span class="n">first_match</span><span class="o">.</span><span class="n">start</span><span class="p">()]</span>
- <span class="n">match_action</span> <span class="o">=</span> <span class="n">rem_action</span><span class="p">[</span><span class="n">first_match</span><span class="o">.</span><span class="n">start</span><span class="p">()</span> <span class="p">:</span> <span class="n">first_match</span><span class="o">.</span><span class="n">end</span><span class="p">()]</span>
- <span class="n">rem_action</span> <span class="o">=</span> <span class="n">rem_action</span><span class="p">[</span><span class="n">first_match</span><span class="o">.</span><span class="n">end</span><span class="p">()</span> <span class="p">:]</span>
- <span class="k">if</span> <span class="n">pre_action</span><span class="o">.</span><span class="n">strip</span><span class="p">():</span>
- <span class="n">parsed_action</span><span class="o">.</span><span class="n">append</span><span class="p">(</span><span class="n">pre_action</span><span class="p">)</span>
- <span class="k">if</span> <span class="n">match_action</span><span class="o">.</span><span class="n">strip</span><span class="p">():</span>
- <span class="n">eof</span> <span class="o">=</span> <span class="n">first_match</span><span class="o">.</span><span class="n">group</span><span class="p">(</span><span class="mi">3</span><span class="p">)</span><span class="o">.</span><span class="n">strip</span><span class="p">()</span>
- <span class="k">if</span> <span class="ow">not</span> <span class="n">match_action</span><span class="o">.</span><span class="n">split</span><span class="p">(</span><span class="s2">"</span><span class="se">\n</span><span class="s2">"</span><span class="p">)[</span><span class="mi">0</span><span class="p">]</span><span class="o">.</span><span class="n">strip</span><span class="p">()</span><span class="o">.</span><span class="n">endswith</span><span class="p">(</span><span class="sa">f</span><span class="s2">"<< '</span><span class="si">{</span><span class="n">eof</span><span class="si">}</span><span class="s2">'"</span><span class="p">):</span>
- <span class="n">guarded_command</span> <span class="o">=</span> <span class="n">match_action</span><span class="p">[</span><span class="n">first_match</span><span class="o">.</span><span class="n">start</span><span class="p">()</span> <span class="p">:]</span>
- <span class="n">first_line</span> <span class="o">=</span> <span class="n">guarded_command</span><span class="o">.</span><span class="n">split</span><span class="p">(</span><span class="s2">"</span><span class="se">\n</span><span class="s2">"</span><span class="p">)[</span><span class="mi">0</span><span class="p">]</span>
- <span class="n">guarded_command</span> <span class="o">=</span> <span class="n">guarded_command</span><span class="o">.</span><span class="n">replace</span><span class="p">(</span><span class="n">first_line</span><span class="p">,</span> <span class="n">first_line</span> <span class="o">+</span> <span class="sa">f</span><span class="s2">" << '</span><span class="si">{</span><span class="n">eof</span><span class="si">}</span><span class="s2">'"</span><span class="p">,</span> <span class="mi">1</span><span class="p">)</span>
- <span class="n">parsed_action</span><span class="o">.</span><span class="n">append</span><span class="p">(</span><span class="n">guarded_command</span><span class="p">)</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="n">parsed_action</span><span class="o">.</span><span class="n">append</span><span class="p">(</span><span class="n">match_action</span><span class="p">)</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="n">parsed_action</span><span class="o">.</span><span class="n">append</span><span class="p">(</span><span class="n">rem_action</span><span class="p">)</span>
- <span class="n">rem_action</span> <span class="o">=</span> <span class="s2">""</span>
- <span class="k">return</span> <span class="s2">"</span><span class="se">\n</span><span class="s2">"</span><span class="o">.</span><span class="n">join</span><span class="p">(</span><span class="n">parsed_action</span><span class="p">)</span>
- <span class="k">def</span> <span class="nf">split_actions</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">action</span><span class="p">:</span> <span class="nb">str</span><span class="p">,</span> <span class="n">pattern_type</span><span class="o">=</span><span class="s2">"subroutine"</span><span class="p">)</span> <span class="o">-></span> <span class="nb">list</span><span class="p">[</span><span class="n">SubAction</span><span class="p">]:</span>
- <span class="w"> </span><span class="sd">"""Split an action into a list of actions in a greedy manner, each of which is a subroutine call or a single command."""</span>
- <span class="n">parsed_action</span><span class="p">:</span> <span class="nb">list</span><span class="p">[</span><span class="n">SubAction</span><span class="p">]</span> <span class="o">=</span> <span class="nb">list</span><span class="p">()</span>
- <span class="n">rem_action</span> <span class="o">=</span> <span class="n">action</span>
- <span class="k">while</span> <span class="n">rem_action</span><span class="o">.</span><span class="n">strip</span><span class="p">():</span>
- <span class="n">first_match</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">_get_first_match</span><span class="p">(</span><span class="n">rem_action</span><span class="p">,</span> <span class="n">pattern_type</span><span class="p">)</span>
- <span class="k">if</span> <span class="n">first_match</span><span class="p">:</span>
- <span class="n">pre_action</span> <span class="o">=</span> <span class="n">rem_action</span><span class="p">[:</span> <span class="n">first_match</span><span class="o">.</span><span class="n">start</span><span class="p">()]</span>
- <span class="n">match_action</span> <span class="o">=</span> <span class="n">rem_action</span><span class="p">[</span><span class="n">first_match</span><span class="o">.</span><span class="n">start</span><span class="p">()</span> <span class="p">:</span> <span class="n">first_match</span><span class="o">.</span><span class="n">end</span><span class="p">()]</span>
- <span class="n">rem_action</span> <span class="o">=</span> <span class="n">rem_action</span><span class="p">[</span><span class="n">first_match</span><span class="o">.</span><span class="n">end</span><span class="p">()</span> <span class="p">:]</span>
- <span class="k">if</span> <span class="n">pre_action</span><span class="o">.</span><span class="n">strip</span><span class="p">():</span>
- <span class="n">parsed_action</span><span class="o">.</span><span class="n">append</span><span class="p">({</span><span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">,</span> <span class="s2">"action"</span><span class="p">:</span> <span class="n">pre_action</span><span class="p">,</span> <span class="s2">"cmd_name"</span><span class="p">:</span> <span class="kc">None</span><span class="p">,</span> <span class="s2">"args"</span><span class="p">:</span> <span class="s2">""</span><span class="p">})</span>
- <span class="k">if</span> <span class="n">match_action</span><span class="o">.</span><span class="n">strip</span><span class="p">():</span>
- <span class="k">if</span> <span class="n">match_action</span><span class="o">.</span><span class="n">split</span><span class="p">()[</span><span class="mi">0</span><span class="p">]</span> <span class="o">==</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">submit_command</span><span class="p">:</span>
- <span class="n">parsed_action</span><span class="o">.</span><span class="n">append</span><span class="p">(</span>
- <span class="n">SubAction</span><span class="p">(</span>
- <span class="p">{</span>
- <span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">,</span>
- <span class="s2">"action"</span><span class="p">:</span> <span class="n">match_action</span><span class="p">,</span>
- <span class="s2">"cmd_name"</span><span class="p">:</span> <span class="n">first_match</span><span class="o">.</span><span class="n">group</span><span class="p">(</span><span class="mi">1</span><span class="p">),</span>
- <span class="s2">"args"</span><span class="p">:</span> <span class="s2">""</span><span class="p">,</span>
- <span class="p">},</span>
- <span class="p">)</span>
- <span class="p">)</span> <span class="c1"># submit command is not a subroutine</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="n">parsed_action</span><span class="o">.</span><span class="n">append</span><span class="p">(</span>
- <span class="n">SubAction</span><span class="p">(</span>
- <span class="p">{</span>
- <span class="s2">"agent"</span><span class="p">:</span> <span class="n">first_match</span><span class="o">.</span><span class="n">group</span><span class="p">(</span><span class="mi">1</span><span class="p">),</span>
- <span class="s2">"args"</span><span class="p">:</span> <span class="n">first_match</span><span class="o">.</span><span class="n">group</span><span class="p">(</span><span class="mi">2</span><span class="p">),</span>
- <span class="s2">"action"</span><span class="p">:</span> <span class="n">match_action</span><span class="p">,</span>
- <span class="s2">"cmd_name"</span><span class="p">:</span> <span class="n">first_match</span><span class="o">.</span><span class="n">group</span><span class="p">(</span><span class="mi">1</span><span class="p">),</span>
- <span class="p">},</span>
- <span class="p">)</span>
- <span class="p">)</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="n">parsed_action</span><span class="o">.</span><span class="n">append</span><span class="p">(</span>
- <span class="n">SubAction</span><span class="p">({</span><span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">,</span> <span class="s2">"action"</span><span class="p">:</span> <span class="n">rem_action</span><span class="p">,</span> <span class="s2">"cmd_name"</span><span class="p">:</span> <span class="kc">None</span><span class="p">,</span> <span class="s2">"args"</span><span class="p">:</span> <span class="s2">""</span><span class="p">})</span>
- <span class="p">)</span>
- <span class="n">rem_action</span> <span class="o">=</span> <span class="s2">""</span>
- <span class="k">return</span> <span class="n">parsed_action</span>
- <span class="k">def</span> <span class="nf">_parse_command_patterns</span><span class="p">(</span><span class="bp">self</span><span class="p">)</span> <span class="o">-></span> <span class="kc">None</span><span class="p">:</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="c1"># mypy</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">command_patterns</span> <span class="o">=</span> <span class="nb">dict</span><span class="p">()</span>
- <span class="k">for</span> <span class="n">command</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">_commands</span><span class="p">:</span>
- <span class="k">if</span> <span class="n">command</span><span class="o">.</span><span class="n">end_name</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span><span class="p">:</span>
- <span class="n">pat</span> <span class="o">=</span> <span class="n">re</span><span class="o">.</span><span class="n">compile</span><span class="p">(</span>
- <span class="sa">rf</span><span class="s2">"^\s*(</span><span class="si">{</span><span class="n">command</span><span class="o">.</span><span class="n">name</span><span class="si">}</span><span class="s2">)\s*(.*?)^(</span><span class="si">{</span><span class="n">command</span><span class="o">.</span><span class="n">end_name</span><span class="si">}</span><span class="s2">)\s*$"</span><span class="p">,</span>
- <span class="n">re</span><span class="o">.</span><span class="n">DOTALL</span> <span class="o">|</span> <span class="n">re</span><span class="o">.</span><span class="n">MULTILINE</span><span class="p">,</span>
- <span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">command_patterns</span><span class="p">[</span><span class="n">command</span><span class="o">.</span><span class="n">name</span><span class="p">]</span> <span class="o">=</span> <span class="n">pat</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="n">pat</span> <span class="o">=</span> <span class="n">re</span><span class="o">.</span><span class="n">compile</span><span class="p">(</span><span class="sa">rf</span><span class="s2">"^\s*(</span><span class="si">{</span><span class="n">command</span><span class="o">.</span><span class="n">name</span><span class="si">}</span><span class="s2">)\s*(.*?)$"</span><span class="p">,</span> <span class="n">re</span><span class="o">.</span><span class="n">MULTILINE</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">command_patterns</span><span class="p">[</span><span class="n">command</span><span class="o">.</span><span class="n">name</span><span class="p">]</span> <span class="o">=</span> <span class="n">pat</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">subroutine_patterns</span> <span class="o">=</span> <span class="nb">dict</span><span class="p">()</span>
- <span class="k">for</span> <span class="n">_</span><span class="p">,</span> <span class="n">subroutine</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">_subroutines</span><span class="o">.</span><span class="n">items</span><span class="p">():</span>
- <span class="k">if</span> <span class="n">subroutine</span><span class="o">.</span><span class="n">end_name</span> <span class="ow">is</span> <span class="kc">None</span><span class="p">:</span>
- <span class="n">pat</span> <span class="o">=</span> <span class="n">re</span><span class="o">.</span><span class="n">compile</span><span class="p">(</span><span class="sa">rf</span><span class="s2">"^\s*(</span><span class="si">{</span><span class="n">subroutine</span><span class="o">.</span><span class="n">name</span><span class="si">}</span><span class="s2">)\s*(.*?)$"</span><span class="p">,</span> <span class="n">re</span><span class="o">.</span><span class="n">MULTILINE</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">subroutine_patterns</span><span class="p">[</span><span class="n">subroutine</span><span class="o">.</span><span class="n">name</span><span class="p">,]</span> <span class="o">=</span> <span class="n">pat</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="n">pat</span> <span class="o">=</span> <span class="n">re</span><span class="o">.</span><span class="n">compile</span><span class="p">(</span>
- <span class="sa">rf</span><span class="s2">"^\s*(</span><span class="si">{</span><span class="n">subroutine</span><span class="o">.</span><span class="n">name</span><span class="si">}</span><span class="s2">)\s*(.*?)^(</span><span class="si">{</span><span class="n">subroutine</span><span class="o">.</span><span class="n">end_name</span><span class="si">}</span><span class="s2">)\s*$"</span><span class="p">,</span>
- <span class="n">re</span><span class="o">.</span><span class="n">DOTALL</span> <span class="o">|</span> <span class="n">re</span><span class="o">.</span><span class="n">MULTILINE</span><span class="p">,</span>
- <span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">subroutine_patterns</span><span class="p">[</span><span class="n">subroutine</span><span class="o">.</span><span class="n">name</span><span class="p">]</span> <span class="o">=</span> <span class="n">pat</span>
- <span class="k">if</span> <span class="nb">hasattr</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="p">,</span> <span class="s2">"submit_command_end_name"</span><span class="p">):</span>
- <span class="n">submit_pat</span> <span class="o">=</span> <span class="n">re</span><span class="o">.</span><span class="n">compile</span><span class="p">(</span>
- <span class="sa">rf</span><span class="s2">"^\s*(</span><span class="si">{</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">submit_command</span><span class="si">}</span><span class="s2">)\s*(.*?)^(</span><span class="si">{</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">submit_command_end_name</span><span class="si">}</span><span class="s2">)\s*$"</span><span class="p">,</span>
- <span class="n">re</span><span class="o">.</span><span class="n">DOTALL</span> <span class="o">|</span> <span class="n">re</span><span class="o">.</span><span class="n">MULTILINE</span><span class="p">,</span>
- <span class="p">)</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="n">submit_pat</span> <span class="o">=</span> <span class="n">re</span><span class="o">.</span><span class="n">compile</span><span class="p">(</span><span class="sa">rf</span><span class="s2">"^\s*(</span><span class="si">{</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">submit_command</span><span class="si">}</span><span class="s2">)(\s*)$"</span><span class="p">,</span> <span class="n">re</span><span class="o">.</span><span class="n">MULTILINE</span><span class="p">)</span> <span class="c1"># group 2 is nothing</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">subroutine_patterns</span><span class="p">[</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">submit_command</span><span class="p">]</span> <span class="o">=</span> <span class="n">submit_pat</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">command_patterns</span><span class="p">[</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">submit_command</span><span class="p">]</span> <span class="o">=</span> <span class="n">submit_pat</span>
- <span class="k">def</span> <span class="nf">forward</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">observation</span><span class="p">:</span> <span class="nb">str</span> <span class="o">|</span> <span class="kc">None</span><span class="p">,</span> <span class="n">available_actions</span><span class="p">:</span> <span class="nb">list</span><span class="p">[</span><span class="nb">str</span><span class="p">],</span> <span class="n">state</span><span class="p">:</span> <span class="nb">str</span><span class="p">)</span> <span class="o">-></span> <span class="nb">tuple</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="nb">str</span><span class="p">,</span> <span class="nb">str</span><span class="p">]:</span>
- <span class="w"> </span><span class="sd">"""Forwards the model</span>
- <span class="sd"> Args:</span>
- <span class="sd"> observation: Observation</span>
- <span class="sd"> available_actions: Currently not used</span>
- <span class="sd"> state:</span>
- <span class="sd"> Returns:</span>
- <span class="sd"> thought: model reasoning</span>
- <span class="sd"> action: action that the model proposes</span>
- <span class="sd"> output: raw model output (not output of the action)</span>
- <span class="sd"> """</span>
- <span class="n">thought</span><span class="p">,</span> <span class="n">action</span><span class="p">,</span> <span class="n">output</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">forward_with_error_check</span><span class="p">(</span><span class="n">observation</span><span class="p">,</span> <span class="n">state</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_append_history</span><span class="p">(</span>
- <span class="p">{</span>
- <span class="s2">"role"</span><span class="p">:</span> <span class="s2">"assistant"</span><span class="p">,</span>
- <span class="s2">"content"</span><span class="p">:</span> <span class="n">output</span><span class="p">,</span>
- <span class="s2">"thought"</span><span class="p">:</span> <span class="n">thought</span><span class="p">,</span>
- <span class="s2">"action"</span><span class="p">:</span> <span class="n">action</span><span class="p">,</span>
- <span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">,</span>
- <span class="p">},</span>
- <span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">info</span><span class="p">(</span><span class="sa">f</span><span class="s2">"💭 THOUGHT (</span><span class="si">{</span><span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="si">}</span><span class="s2">)</span><span class="se">\n</span><span class="si">{</span><span class="n">thought</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">info</span><span class="p">(</span><span class="sa">f</span><span class="s2">"🎬 ACTION (</span><span class="si">{</span><span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="si">}</span><span class="s2">)</span><span class="se">\n</span><span class="si">{</span><span class="n">action</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="k">return</span> <span class="n">thought</span><span class="p">,</span> <span class="n">action</span><span class="p">,</span> <span class="n">output</span>
- <span class="k">def</span> <span class="nf">forward_model</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">observation</span><span class="p">:</span> <span class="nb">str</span> <span class="o">|</span> <span class="kc">None</span><span class="p">,</span> <span class="n">state</span><span class="p">:</span> <span class="nb">str</span><span class="p">)</span> <span class="o">-></span> <span class="nb">str</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Query the model with the current state and observation with the appropriate template.</span>
- <span class="sd"> Returns:</span>
- <span class="sd"> output: raw model output (not output of the command)</span>
- <span class="sd"> """</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="c1"># mypy</span>
- <span class="k">try</span><span class="p">:</span>
- <span class="n">state_vars</span> <span class="o">=</span> <span class="n">json</span><span class="o">.</span><span class="n">loads</span><span class="p">(</span><span class="n">state</span><span class="p">)</span>
- <span class="k">except</span> <span class="n">json</span><span class="o">.</span><span class="n">JSONDecodeError</span> <span class="k">as</span> <span class="n">e</span><span class="p">:</span>
- <span class="n">msg</span> <span class="o">=</span> <span class="sa">f</span><span class="s2">"State </span><span class="si">{</span><span class="n">state</span><span class="si">!r}</span><span class="s2"> is not valid json. This is an internal error, please report it."</span>
- <span class="k">raise</span> <span class="ne">ValueError</span><span class="p">(</span><span class="n">msg</span><span class="p">)</span> <span class="kn">from</span> <span class="nn">e</span>
- <span class="n">templates</span><span class="p">:</span> <span class="nb">list</span><span class="p">[</span><span class="nb">str</span><span class="p">]</span> <span class="o">=</span> <span class="p">[]</span>
- <span class="c1"># Determine observation template based on what prior observation was</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">history</span><span class="p">[</span><span class="o">-</span><span class="mi">1</span><span class="p">][</span><span class="s2">"role"</span><span class="p">]</span> <span class="o">==</span> <span class="s2">"system"</span> <span class="ow">or</span> <span class="bp">self</span><span class="o">.</span><span class="n">history</span><span class="p">[</span><span class="o">-</span><span class="mi">1</span><span class="p">]</span><span class="o">.</span><span class="n">get</span><span class="p">(</span><span class="s2">"is_demo"</span><span class="p">,</span> <span class="kc">False</span><span class="p">):</span>
- <span class="c1"># Show instance template if prev. obs. was initial system message</span>
- <span class="n">templates</span> <span class="o">=</span> <span class="p">[</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">instance_template</span><span class="p">]</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">strategy_template</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span><span class="p">:</span>
- <span class="n">templates</span><span class="o">.</span><span class="n">append</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">strategy_template</span><span class="p">)</span>
- <span class="k">elif</span> <span class="n">observation</span> <span class="ow">is</span> <span class="kc">None</span> <span class="ow">or</span> <span class="n">observation</span><span class="o">.</span><span class="n">strip</span><span class="p">()</span> <span class="o">==</span> <span class="s2">""</span><span class="p">:</span>
- <span class="c1"># Show no output template if observation content was empty</span>
- <span class="n">templates</span> <span class="o">=</span> <span class="p">[</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">next_step_no_output_template</span><span class="p">]</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="c1"># Show standard output template if there is observation content</span>
- <span class="n">templates</span> <span class="o">=</span> <span class="p">[</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">next_step_template</span><span class="p">]</span>
- <span class="c1"># Populate selected template(s) with information (e.g., issue, arguments, state)</span>
- <span class="n">messages</span> <span class="o">=</span> <span class="p">[]</span>
- <span class="k">for</span> <span class="n">template</span> <span class="ow">in</span> <span class="n">templates</span><span class="p">:</span>
- <span class="n">messages</span><span class="o">.</span><span class="n">append</span><span class="p">(</span>
- <span class="n">template</span><span class="o">.</span><span class="n">format</span><span class="p">(</span>
- <span class="o">**</span><span class="bp">self</span><span class="o">.</span><span class="n">instance_args</span><span class="p">,</span>
- <span class="o">**</span><span class="bp">self</span><span class="o">.</span><span class="n">system_args</span><span class="p">,</span>
- <span class="o">**</span><span class="n">state_vars</span><span class="p">,</span>
- <span class="n">observation</span><span class="o">=</span><span class="p">(</span><span class="n">observation</span> <span class="k">if</span> <span class="n">observation</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="k">else</span> <span class="s2">""</span><span class="p">),</span>
- <span class="o">**</span><span class="bp">self</span><span class="o">.</span><span class="n">_forwarded_vars</span><span class="p">,</span>
- <span class="p">),</span>
- <span class="p">)</span>
- <span class="n">message</span> <span class="o">=</span> <span class="s2">"</span><span class="se">\n</span><span class="s2">"</span><span class="o">.</span><span class="n">join</span><span class="p">(</span><span class="n">messages</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">info</span><span class="p">(</span><span class="sa">f</span><span class="s2">"🤖 MODEL INPUT</span><span class="se">\n</span><span class="si">{</span><span class="n">message</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_append_history</span><span class="p">({</span><span class="s2">"role"</span><span class="p">:</span> <span class="s2">"user"</span><span class="p">,</span> <span class="s2">"content"</span><span class="p">:</span> <span class="n">message</span><span class="p">,</span> <span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">})</span>
- <span class="k">for</span> <span class="n">hook</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">hooks</span><span class="p">:</span>
- <span class="n">hook</span><span class="o">.</span><span class="n">on_model_query</span><span class="p">(</span><span class="n">query</span><span class="o">=</span><span class="bp">self</span><span class="o">.</span><span class="n">local_history</span><span class="p">,</span> <span class="n">agent</span><span class="o">=</span><span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">)</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">query</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">local_history</span><span class="p">)</span>
- <span class="k">def</span> <span class="nf">retry_after_format_fail</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">output</span><span class="p">:</span> <span class="nb">str</span><span class="p">)</span> <span class="o">-></span> <span class="nb">str</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Ask the model to correct (without committing to persistent history) after a malformatted model output"""</span>
- <span class="n">format_error_template</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">format_error_template</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="sa">f</span><span class="s2">"MALFORMED OUTPUT</span><span class="se">\n</span><span class="si">{</span><span class="n">output</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="sa">f</span><span class="s2">"FORMAT ERROR</span><span class="se">\n</span><span class="si">{</span><span class="n">format_error_template</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="n">temp_history</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">local_history</span> <span class="o">+</span> <span class="p">[</span>
- <span class="p">{</span><span class="s2">"role"</span><span class="p">:</span> <span class="s2">"assistant"</span><span class="p">,</span> <span class="s2">"content"</span><span class="p">:</span> <span class="n">output</span><span class="p">,</span> <span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">},</span>
- <span class="p">{</span><span class="s2">"role"</span><span class="p">:</span> <span class="s2">"user"</span><span class="p">,</span> <span class="s2">"content"</span><span class="p">:</span> <span class="n">format_error_template</span><span class="p">,</span> <span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">},</span>
- <span class="p">]</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">query</span><span class="p">(</span><span class="n">temp_history</span><span class="p">)</span>
- <span class="k">def</span> <span class="nf">retry_after_blocklist_fail</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">output</span><span class="p">:</span> <span class="nb">str</span><span class="p">,</span> <span class="n">action</span><span class="p">:</span> <span class="nb">str</span><span class="p">)</span> <span class="o">-></span> <span class="nb">str</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Ask the model to correct (without committing to persistent history) after a disallowed command"""</span>
- <span class="n">name</span> <span class="o">=</span> <span class="n">action</span><span class="o">.</span><span class="n">strip</span><span class="p">()</span><span class="o">.</span><span class="n">split</span><span class="p">()[</span><span class="mi">0</span><span class="p">]</span>
- <span class="n">blocklist_error_message</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">blocklist_error_template</span><span class="o">.</span><span class="n">format</span><span class="p">(</span><span class="n">name</span><span class="o">=</span><span class="n">name</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="sa">f</span><span class="s2">"BLOCKLISTED OUTPUT</span><span class="se">\n</span><span class="si">{</span><span class="n">output</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="sa">f</span><span class="s2">"BLOCKLIST ERROR</span><span class="se">\n</span><span class="si">{</span><span class="n">blocklist_error_message</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="n">temp_history</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">local_history</span> <span class="o">+</span> <span class="p">[</span>
- <span class="p">{</span><span class="s2">"role"</span><span class="p">:</span> <span class="s2">"assistant"</span><span class="p">,</span> <span class="s2">"content"</span><span class="p">:</span> <span class="n">output</span><span class="p">,</span> <span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">},</span>
- <span class="p">{</span><span class="s2">"role"</span><span class="p">:</span> <span class="s2">"user"</span><span class="p">,</span> <span class="s2">"content"</span><span class="p">:</span> <span class="n">blocklist_error_message</span><span class="p">,</span> <span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">},</span>
- <span class="p">]</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">query</span><span class="p">(</span><span class="n">temp_history</span><span class="p">)</span>
- <span class="k">def</span> <span class="nf">should_block_action</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">action</span><span class="p">:</span> <span class="nb">str</span><span class="p">)</span> <span class="o">-></span> <span class="nb">bool</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Check if the command should be blocked."""</span>
- <span class="n">names</span> <span class="o">=</span> <span class="n">action</span><span class="o">.</span><span class="n">strip</span><span class="p">()</span><span class="o">.</span><span class="n">split</span><span class="p">()</span>
- <span class="k">if</span> <span class="nb">len</span><span class="p">(</span><span class="n">names</span><span class="p">)</span> <span class="o">==</span> <span class="mi">0</span><span class="p">:</span>
- <span class="k">return</span> <span class="kc">False</span>
- <span class="n">name</span> <span class="o">=</span> <span class="n">names</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span>
- <span class="k">if</span> <span class="n">name</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">blocklist</span><span class="p">:</span>
- <span class="k">return</span> <span class="kc">True</span>
- <span class="k">if</span> <span class="n">name</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">blocklist_standalone</span> <span class="ow">and</span> <span class="n">name</span> <span class="o">==</span> <span class="n">action</span><span class="o">.</span><span class="n">strip</span><span class="p">():</span>
- <span class="k">return</span> <span class="kc">True</span>
- <span class="k">if</span> <span class="n">name</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">block_unless_regex</span> <span class="ow">and</span> <span class="ow">not</span> <span class="n">re</span><span class="o">.</span><span class="n">search</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">block_unless_regex</span><span class="p">[</span><span class="n">name</span><span class="p">],</span> <span class="n">action</span><span class="p">):</span>
- <span class="k">return</span> <span class="kc">True</span>
- <span class="k">return</span> <span class="kc">False</span>
- <span class="k">def</span> <span class="nf">check_format_and_requery</span><span class="p">(</span>
- <span class="bp">self</span><span class="p">,</span>
- <span class="n">output</span><span class="p">:</span> <span class="nb">str</span><span class="p">,</span>
- <span class="p">)</span> <span class="o">-></span> <span class="nb">tuple</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="nb">str</span><span class="p">,</span> <span class="nb">str</span><span class="p">]:</span>
- <span class="w"> </span><span class="sd">"""Query the model with the current state and observation with the appropriate template.</span>
- <span class="sd"> Try to parse the output into a thought and action. Retry if the output is malformatted or the action is blocked.</span>
- <span class="sd"> Returns:</span>
- <span class="sd"> thought: model reasoning</span>
- <span class="sd"> action: action that the model proposes</span>
- <span class="sd"> output: raw model output</span>
- <span class="sd"> """</span>
- <span class="c1"># Condition for handling outputs with no thought (just action)</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">args</span><span class="o">.</span><span class="n">model_name</span> <span class="o">==</span> <span class="s2">"human"</span><span class="p">:</span>
- <span class="k">return</span> <span class="s2">""</span><span class="p">,</span> <span class="n">output</span><span class="p">,</span> <span class="n">output</span>
- <span class="k">elif</span> <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">args</span><span class="o">.</span><span class="n">model_name</span> <span class="o">==</span> <span class="s2">"human_thought"</span><span class="p">:</span>
- <span class="n">thought</span><span class="p">,</span> <span class="n">action</span> <span class="o">=</span> <span class="n">ParseFunction</span><span class="o">.</span><span class="n">get</span><span class="p">(</span><span class="s2">"ThoughtActionParser"</span><span class="p">)(</span>
- <span class="n">output</span><span class="p">,</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">_commands</span> <span class="o">+</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">subroutine_types</span><span class="p">,</span>
- <span class="n">strict</span><span class="o">=</span><span class="kc">False</span><span class="p">,</span>
- <span class="p">)</span>
- <span class="k">return</span> <span class="n">thought</span><span class="p">,</span> <span class="n">action</span><span class="p">,</span> <span class="n">output</span>
- <span class="n">format_fails</span> <span class="o">=</span> <span class="n">blocklist_fails</span> <span class="o">=</span> <span class="mi">0</span>
- <span class="k">while</span> <span class="n">format_fails</span> <span class="o">+</span> <span class="n">blocklist_fails</span> <span class="o"><=</span> <span class="mi">2</span><span class="p">:</span>
- <span class="k">try</span><span class="p">:</span>
- <span class="n">thought</span><span class="p">,</span> <span class="n">action</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">parse_function</span><span class="p">(</span>
- <span class="n">output</span><span class="p">,</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">_commands</span> <span class="o">+</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">subroutine_types</span><span class="p">,</span>
- <span class="n">strict</span><span class="o">=</span><span class="kc">False</span><span class="p">,</span>
- <span class="p">)</span>
- <span class="k">except</span> <span class="ne">KeyboardInterrupt</span><span class="p">:</span>
- <span class="k">raise</span>
- <span class="k">except</span> <span class="n">FormatError</span><span class="p">:</span>
- <span class="n">format_fails</span> <span class="o">+=</span> <span class="mi">1</span>
- <span class="n">output</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">retry_after_format_fail</span><span class="p">(</span><span class="n">output</span><span class="p">)</span>
- <span class="k">continue</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">should_block_action</span><span class="p">(</span><span class="n">action</span><span class="p">):</span>
- <span class="n">blocklist_fails</span> <span class="o">+=</span> <span class="mi">1</span>
- <span class="n">output</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">retry_after_blocklist_fail</span><span class="p">(</span><span class="n">output</span><span class="p">,</span> <span class="n">action</span><span class="p">)</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="k">return</span> <span class="n">thought</span><span class="p">,</span> <span class="n">action</span><span class="p">,</span> <span class="n">output</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="sa">f</span><span class="s2">"Malformat limit reached: </span><span class="se">\n</span><span class="si">{</span><span class="n">output</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="k">return</span> <span class="s2">"Exit due to format error"</span><span class="p">,</span> <span class="s2">"exit_format"</span><span class="p">,</span> <span class="n">output</span>
- <span class="k">def</span> <span class="nf">forward_with_error_check</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">observation</span><span class="p">:</span> <span class="nb">str</span> <span class="o">|</span> <span class="kc">None</span><span class="p">,</span> <span class="n">state</span><span class="p">:</span> <span class="nb">str</span><span class="p">)</span> <span class="o">-></span> <span class="nb">tuple</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="nb">str</span><span class="p">,</span> <span class="nb">str</span><span class="p">]:</span>
- <span class="w"> </span><span class="sd">"""Wrapper around `self.forward_model` that handles errors and retries</span>
- <span class="sd"> due to format errors or blocked actions.</span>
- <span class="sd"> Returns:</span>
- <span class="sd"> thought: model reasoning</span>
- <span class="sd"> action: action that the model proposes</span>
- <span class="sd"> output: raw model output</span>
- <span class="sd"> """</span>
- <span class="k">try</span><span class="p">:</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">check_format_and_requery</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">forward_model</span><span class="p">(</span><span class="n">observation</span><span class="p">,</span> <span class="n">state</span><span class="p">))</span>
- <span class="k">except</span> <span class="ne">KeyboardInterrupt</span><span class="p">:</span>
- <span class="k">raise</span>
- <span class="k">except</span> <span class="ne">RuntimeError</span> <span class="k">as</span> <span class="n">e</span><span class="p">:</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="sa">f</span><span class="s2">"Runtime error: </span><span class="si">{</span><span class="n">e</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="k">return</span> <span class="p">(</span>
- <span class="sa">f</span><span class="s2">"Exit due to runtime error: </span><span class="si">{</span><span class="n">e</span><span class="si">}</span><span class="s2">"</span><span class="p">,</span>
- <span class="s2">"exit_error"</span><span class="p">,</span>
- <span class="sa">f</span><span class="s2">"exit due to runtime error: </span><span class="si">{</span><span class="n">e</span><span class="si">}</span><span class="s2">"</span><span class="p">,</span>
- <span class="p">)</span>
- <span class="k">except</span> <span class="n">ContextWindowExceededError</span><span class="p">:</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="s2">"Context window exceeded"</span><span class="p">)</span>
- <span class="k">return</span> <span class="s2">"Exit due to context window"</span><span class="p">,</span> <span class="s2">"exit_context"</span><span class="p">,</span> <span class="s2">"Exit due to context window"</span>
- <span class="k">except</span> <span class="n">CostLimitExceededError</span><span class="p">:</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="s2">"Cost limit exceeded"</span><span class="p">)</span>
- <span class="k">return</span> <span class="s2">"Exit due to cost limit"</span><span class="p">,</span> <span class="s2">"exit_cost"</span><span class="p">,</span> <span class="s2">"Exit due to cost limit"</span>
- <span class="k">except</span> <span class="n">RetryError</span> <span class="k">as</span> <span class="n">e</span><span class="p">:</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="sa">f</span><span class="s2">"Retry error: </span><span class="si">{</span><span class="n">e</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="k">return</span> <span class="p">(</span>
- <span class="sa">f</span><span class="s2">"Exit due to retry error: </span><span class="si">{</span><span class="n">e</span><span class="si">}</span><span class="s2">"</span><span class="p">,</span>
- <span class="s2">"exit_api"</span><span class="p">,</span>
- <span class="sa">f</span><span class="s2">"exit due to retry error: </span><span class="si">{</span><span class="n">e</span><span class="si">}</span><span class="s2">"</span><span class="p">,</span>
- <span class="p">)</span>
- <span class="k">def</span> <span class="nf">init_environment_vars</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="p">:</span> <span class="n">SWEEnv</span><span class="p">):</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">set_environment_vars</span><span class="p">(</span><span class="n">env</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">env_variables</span><span class="p">)</span>
- <span class="k">def</span> <span class="nf">set_environment_vars</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="p">:</span> <span class="n">SWEEnv</span><span class="p">,</span> <span class="n">env_variables</span><span class="p">:</span> <span class="nb">dict</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="n">Any</span><span class="p">])</span> <span class="o">-></span> <span class="kc">None</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Sets environment variables in the container and for example makes sure</span>
- <span class="sd"> that all the commands are available in the PATH on the container.</span>
- <span class="sd"> """</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="c1"># mypy</span>
- <span class="n">commands_to_execute</span> <span class="o">=</span> <span class="p">(</span>
- <span class="p">[</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">state_command</span><span class="o">.</span><span class="n">code</span><span class="p">]</span>
- <span class="o">+</span>
- <span class="c1"># [code for code in self.config.util_functions] +</span>
- <span class="c1"># [command.code for command in self.config._commands] +</span>
- <span class="p">[</span><span class="sa">f</span><span class="s2">"</span><span class="si">{</span><span class="n">k</span><span class="si">}</span><span class="s2">=</span><span class="si">{</span><span class="n">v</span><span class="si">}</span><span class="s2">"</span> <span class="k">for</span> <span class="n">k</span><span class="p">,</span> <span class="n">v</span> <span class="ow">in</span> <span class="n">env_variables</span><span class="o">.</span><span class="n">items</span><span class="p">()]</span>
- <span class="p">)</span>
- <span class="n">commands</span> <span class="o">=</span> <span class="s2">"</span><span class="se">\n</span><span class="s2">"</span><span class="o">.</span><span class="n">join</span><span class="p">(</span><span class="n">commands_to_execute</span><span class="p">)</span>
- <span class="k">try</span><span class="p">:</span>
- <span class="n">output</span> <span class="o">=</span> <span class="n">env</span><span class="o">.</span><span class="n">communicate</span><span class="p">(</span><span class="n">commands</span><span class="p">)</span>
- <span class="k">if</span> <span class="n">env</span><span class="o">.</span><span class="n">returncode</span> <span class="o">!=</span> <span class="mi">0</span><span class="p">:</span>
- <span class="n">msg</span> <span class="o">=</span> <span class="sa">f</span><span class="s2">"Nonzero return code: </span><span class="si">{</span><span class="n">env</span><span class="o">.</span><span class="n">returncode</span><span class="si">}</span><span class="se">\n</span><span class="s2">Output: </span><span class="si">{</span><span class="n">output</span><span class="si">}</span><span class="s2">"</span>
- <span class="k">raise</span> <span class="ne">RuntimeError</span><span class="p">(</span><span class="n">msg</span><span class="p">)</span>
- <span class="k">except</span> <span class="ne">KeyboardInterrupt</span><span class="p">:</span>
- <span class="k">raise</span>
- <span class="k">except</span> <span class="ne">Exception</span> <span class="k">as</span> <span class="n">e</span><span class="p">:</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="sa">f</span><span class="s2">"Failed to set environment variables: </span><span class="si">{</span><span class="n">traceback</span><span class="o">.</span><span class="n">format_exc</span><span class="p">()</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="k">raise</span> <span class="n">e</span>
- <span class="n">command_files</span> <span class="o">=</span> <span class="nb">list</span><span class="p">()</span>
- <span class="k">for</span> <span class="n">file</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">command_files</span><span class="p">:</span>
- <span class="n">datum</span> <span class="o">=</span> <span class="nb">dict</span><span class="p">()</span>
- <span class="k">with</span> <span class="nb">open</span><span class="p">(</span><span class="n">file</span><span class="p">)</span> <span class="k">as</span> <span class="n">f</span><span class="p">:</span>
- <span class="n">contents</span> <span class="o">=</span> <span class="n">f</span><span class="o">.</span><span class="n">read</span><span class="p">()</span>
- <span class="n">datum</span><span class="p">[</span><span class="s2">"contents"</span><span class="p">]</span> <span class="o">=</span> <span class="n">contents</span>
- <span class="n">filename</span> <span class="o">=</span> <span class="n">Path</span><span class="p">(</span><span class="n">file</span><span class="p">)</span><span class="o">.</span><span class="n">name</span>
- <span class="k">if</span> <span class="ow">not</span> <span class="n">contents</span><span class="o">.</span><span class="n">strip</span><span class="p">()</span><span class="o">.</span><span class="n">startswith</span><span class="p">(</span><span class="s2">"#!"</span><span class="p">):</span>
- <span class="k">if</span> <span class="n">filename</span><span class="o">.</span><span class="n">endswith</span><span class="p">(</span><span class="s2">".sh"</span><span class="p">):</span>
- <span class="c1"># files are sourced, so they are not executable</span>
- <span class="n">datum</span><span class="p">[</span><span class="s2">"name"</span><span class="p">]</span> <span class="o">=</span> <span class="n">Path</span><span class="p">(</span><span class="n">file</span><span class="p">)</span><span class="o">.</span><span class="n">name</span>
- <span class="n">datum</span><span class="p">[</span><span class="s2">"type"</span><span class="p">]</span> <span class="o">=</span> <span class="s2">"source_file"</span>
- <span class="k">elif</span> <span class="n">filename</span><span class="o">.</span><span class="n">startswith</span><span class="p">(</span><span class="s2">"_"</span><span class="p">):</span>
- <span class="c1"># files are sourced, so they are not executable</span>
- <span class="n">datum</span><span class="p">[</span><span class="s2">"name"</span><span class="p">]</span> <span class="o">=</span> <span class="n">Path</span><span class="p">(</span><span class="n">file</span><span class="p">)</span><span class="o">.</span><span class="n">name</span>
- <span class="n">datum</span><span class="p">[</span><span class="s2">"type"</span><span class="p">]</span> <span class="o">=</span> <span class="s2">"utility"</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="n">msg</span> <span class="o">=</span> <span class="p">(</span>
- <span class="sa">f</span><span class="s2">"Non-shell script file </span><span class="si">{</span><span class="n">file</span><span class="si">}</span><span class="s2"> does not start with shebang.</span><span class="se">\n</span><span class="s2">"</span>
- <span class="s2">"Either add a shebang (#!) or change the file extension to .sh if you want to source it.</span><span class="se">\n</span><span class="s2">"</span>
- <span class="s2">"You can override this behavior by adding an underscore to the file name (e.g. _utils.py)."</span>
- <span class="p">)</span>
- <span class="k">raise</span> <span class="ne">ValueError</span><span class="p">(</span><span class="n">msg</span><span class="p">)</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="c1"># scripts are made executable</span>
- <span class="n">datum</span><span class="p">[</span><span class="s2">"name"</span><span class="p">]</span> <span class="o">=</span> <span class="n">Path</span><span class="p">(</span><span class="n">file</span><span class="p">)</span><span class="o">.</span><span class="n">name</span><span class="o">.</span><span class="n">rsplit</span><span class="p">(</span><span class="s2">"."</span><span class="p">,</span> <span class="mi">1</span><span class="p">)[</span><span class="mi">0</span><span class="p">]</span>
- <span class="n">datum</span><span class="p">[</span><span class="s2">"type"</span><span class="p">]</span> <span class="o">=</span> <span class="s2">"script"</span>
- <span class="n">command_files</span><span class="o">.</span><span class="n">append</span><span class="p">(</span><span class="n">datum</span><span class="p">)</span>
- <span class="n">env</span><span class="o">.</span><span class="n">add_commands</span><span class="p">(</span><span class="n">command_files</span><span class="p">)</span>
- <span class="k">def</span> <span class="nf">get_environment_vars</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="p">:</span> <span class="n">SWEEnv</span><span class="p">)</span> <span class="o">-></span> <span class="nb">dict</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="n">Any</span><span class="p">]:</span>
- <span class="w"> </span><span class="sd">"""Get environment variables inside of the container"""</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="c1"># mypy</span>
- <span class="n">env_vars</span> <span class="o">=</span> <span class="nb">dict</span><span class="p">()</span>
- <span class="k">for</span> <span class="n">var</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">env_variables</span><span class="p">:</span>
- <span class="n">env_vars</span><span class="p">[</span><span class="n">var</span><span class="p">]</span> <span class="o">=</span> <span class="n">env</span><span class="o">.</span><span class="n">communicate</span><span class="p">(</span><span class="sa">f</span><span class="s2">"echo $</span><span class="si">{</span><span class="n">var</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span><span class="o">.</span><span class="n">strip</span><span class="p">()</span>
- <span class="k">return</span> <span class="n">env_vars</span>
- <span class="k">def</span> <span class="nf">call_subroutine</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">agent_name</span><span class="p">:</span> <span class="nb">str</span><span class="p">,</span> <span class="n">sub_action</span><span class="p">:</span> <span class="n">SubAction</span><span class="p">,</span> <span class="n">env</span><span class="p">:</span> <span class="n">SWEEnv</span><span class="p">):</span>
- <span class="w"> </span><span class="sd">"""Call subroutine"""</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="c1"># mypy</span>
- <span class="n">env_vars</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">get_environment_vars</span><span class="p">(</span><span class="n">env</span><span class="p">)</span>
- <span class="n">cwd</span> <span class="o">=</span> <span class="n">env</span><span class="o">.</span><span class="n">communicate</span><span class="p">(</span><span class="s2">"pwd -P"</span><span class="p">)</span><span class="o">.</span><span class="n">strip</span><span class="p">()</span>
- <span class="n">init_observation</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">_subroutines</span><span class="p">[</span><span class="n">agent_name</span><span class="p">]</span><span class="o">.</span><span class="n">init_observation</span>
- <span class="k">if</span> <span class="n">init_observation</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span><span class="p">:</span>
- <span class="n">obs</span><span class="p">,</span> <span class="n">_</span><span class="p">,</span> <span class="n">_</span><span class="p">,</span> <span class="n">_</span> <span class="o">=</span> <span class="n">env</span><span class="o">.</span><span class="n">step</span><span class="p">(</span><span class="n">init_observation</span><span class="o">.</span><span class="n">format</span><span class="p">(</span><span class="n">args</span><span class="o">=</span><span class="n">sub_action</span><span class="p">[</span><span class="s2">"args"</span><span class="p">]))</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="n">obs</span> <span class="o">=</span> <span class="kc">None</span>
- <span class="k">if</span> <span class="n">env</span><span class="o">.</span><span class="n">returncode</span> <span class="o">!=</span> <span class="mi">0</span><span class="p">:</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_append_history</span><span class="p">(</span><span class="n">HistoryItem</span><span class="p">({</span><span class="s2">"role"</span><span class="p">:</span> <span class="s2">"user"</span><span class="p">,</span> <span class="s2">"content"</span><span class="p">:</span> <span class="n">obs</span><span class="p">,</span> <span class="s2">"agent"</span><span class="p">:</span> <span class="n">agent_name</span><span class="p">}))</span>
- <span class="n">msg</span> <span class="o">=</span> <span class="sa">f</span><span class="s2">"Nonzero return code: </span><span class="si">{</span><span class="n">env</span><span class="o">.</span><span class="n">returncode</span><span class="si">}</span><span class="s2"> for init_observation in </span><span class="si">{</span><span class="n">agent_name</span><span class="si">}</span><span class="s2">.</span><span class="se">\n</span><span class="si">{</span><span class="n">obs</span><span class="si">}</span><span class="s2">"</span>
- <span class="k">raise</span> <span class="ne">RuntimeError</span><span class="p">(</span><span class="n">msg</span><span class="p">)</span>
- <span class="n">return_type</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">_subroutines</span><span class="p">[</span><span class="n">agent_name</span><span class="p">]</span><span class="o">.</span><span class="n">return_type</span>
- <span class="n">sub_agent</span> <span class="o">=</span> <span class="n">Agent</span><span class="p">(</span><span class="n">agent_name</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">_subroutines</span><span class="p">[</span><span class="n">agent_name</span><span class="p">]</span><span class="o">.</span><span class="n">agent_args</span><span class="p">)</span>
- <span class="n">sub_agent_output</span> <span class="o">=</span> <span class="n">sub_agent</span><span class="o">.</span><span class="n">run</span><span class="p">(</span>
- <span class="p">{</span><span class="s2">"issue"</span><span class="p">:</span> <span class="n">sub_action</span><span class="p">[</span><span class="s2">"args"</span><span class="p">]},</span>
- <span class="n">env</span><span class="p">,</span>
- <span class="n">observation</span><span class="o">=</span><span class="n">obs</span><span class="p">,</span>
- <span class="n">return_type</span><span class="o">=</span><span class="n">return_type</span><span class="p">,</span>
- <span class="n">init_model_stats</span><span class="o">=</span><span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">stats</span><span class="p">,</span>
- <span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">history</span> <span class="o">+=</span> <span class="n">sub_agent</span><span class="o">.</span><span class="n">history</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">set_environment_vars</span><span class="p">(</span><span class="n">env</span><span class="p">,</span> <span class="n">env_vars</span><span class="p">)</span>
- <span class="n">env</span><span class="o">.</span><span class="n">communicate</span><span class="p">(</span><span class="sa">f</span><span class="s2">"cd </span><span class="si">{</span><span class="n">cwd</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">stats</span><span class="o">.</span><span class="n">replace</span><span class="p">(</span><span class="n">sub_agent</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">stats</span><span class="p">)</span>
- <span class="k">return</span> <span class="n">sub_agent_output</span>
- <span class="k">def</span> <span class="nf">_update_summarizer_stats</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">cost</span><span class="p">:</span> <span class="n">APIStats</span><span class="p">):</span>
- <span class="w"> </span><span class="sd">"""Update stats for summarizer"""</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">stats</span> <span class="o">+=</span> <span class="n">cost</span>
- <span class="k">if</span> <span class="s2">"summarizer"</span> <span class="ow">not</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">info</span><span class="p">:</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">info</span><span class="p">[</span><span class="s2">"summarizer"</span><span class="p">]</span> <span class="o">=</span> <span class="p">{</span>
- <span class="s2">"model_stats"</span><span class="p">:</span> <span class="n">APIStats</span><span class="p">()</span><span class="o">.</span><span class="n">to_dict</span><span class="p">(),</span>
- <span class="s2">"n_calls"</span><span class="p">:</span> <span class="mi">0</span><span class="p">,</span>
- <span class="p">}</span>
- <span class="n">total_cost</span> <span class="o">=</span> <span class="n">APIStats</span><span class="p">(</span><span class="o">**</span><span class="bp">self</span><span class="o">.</span><span class="n">info</span><span class="p">[</span><span class="s2">"summarizer"</span><span class="p">][</span><span class="s2">"model_stats"</span><span class="p">])</span>
- <span class="n">total_cost</span> <span class="o">+=</span> <span class="n">cost</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">info</span><span class="p">[</span><span class="s2">"summarizer"</span><span class="p">][</span><span class="s2">"model_stats"</span><span class="p">]</span> <span class="o">=</span> <span class="n">total_cost</span><span class="o">.</span><span class="n">to_dict</span><span class="p">()</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">info</span><span class="p">[</span><span class="s2">"summarizer"</span><span class="p">][</span><span class="s2">"n_calls"</span><span class="p">]</span> <span class="o">+=</span> <span class="mi">1</span>
- <span class="k">def</span> <span class="nf">_run_sub_action</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">sub_action</span><span class="p">:</span> <span class="n">SubAction</span><span class="p">)</span> <span class="o">-></span> <span class="nb">tuple</span><span class="p">[</span><span class="nb">str</span> <span class="o">|</span> <span class="kc">None</span><span class="p">,</span> <span class="nb">bool</span><span class="p">]:</span>
- <span class="w"> </span><span class="sd">"""Execute a sub-action. If the sub-action is a command, execute it.</span>
- <span class="sd"> If it is a subroutine, call the subroutine.</span>
- <span class="sd"> Returns:</span>
- <span class="sd"> observation: Observation</span>
- <span class="sd"> done: Whether `submit` or another exit reason was called</span>
- <span class="sd"> """</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">_env</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span>
- <span class="k">if</span> <span class="n">sub_action</span><span class="p">[</span><span class="s2">"agent"</span><span class="p">]</span> <span class="o">==</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span> <span class="ow">or</span> <span class="n">sub_action</span><span class="p">[</span><span class="s2">"cmd_name"</span><span class="p">]</span> <span class="o">==</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">submit_command</span><span class="p">:</span>
- <span class="c1"># Normal command, not a subroutine</span>
- <span class="k">for</span> <span class="n">hook</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">hooks</span><span class="p">:</span>
- <span class="n">hook</span><span class="o">.</span><span class="n">on_sub_action_started</span><span class="p">(</span><span class="n">sub_action</span><span class="o">=</span><span class="n">sub_action</span><span class="p">)</span>
- <span class="n">observation</span><span class="p">,</span> <span class="n">_</span><span class="p">,</span> <span class="n">done</span><span class="p">,</span> <span class="n">_info</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">_env</span><span class="o">.</span><span class="n">step</span><span class="p">(</span><span class="n">sub_action</span><span class="p">[</span><span class="s2">"action"</span><span class="p">])</span>
- <span class="n">observation</span><span class="p">,</span> <span class="n">additional_cost</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">summarizer_config</span><span class="o">.</span><span class="n">function</span><span class="p">(</span> <span class="c1"># type: ignore</span>
- <span class="n">sub_action</span><span class="p">[</span><span class="s2">"action"</span><span class="p">],</span> <span class="n">observation</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">_env</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">summarizer_model</span>
- <span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_update_summarizer_stats</span><span class="p">(</span><span class="n">additional_cost</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">info</span><span class="o">.</span><span class="n">update</span><span class="p">(</span><span class="n">_info</span><span class="p">)</span>
- <span class="k">for</span> <span class="n">hook</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">hooks</span><span class="p">:</span>
- <span class="n">hook</span><span class="o">.</span><span class="n">on_sub_action_executed</span><span class="p">(</span><span class="n">obs</span><span class="o">=</span><span class="n">observation</span><span class="p">,</span> <span class="n">done</span><span class="o">=</span><span class="n">done</span><span class="p">)</span>
- <span class="k">if</span> <span class="n">sub_action</span><span class="p">[</span><span class="s2">"cmd_name"</span><span class="p">]</span> <span class="o">==</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">submit_command</span><span class="p">:</span>
- <span class="n">done</span> <span class="o">=</span> <span class="kc">True</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="n">agent_name</span> <span class="o">=</span> <span class="n">sub_action</span><span class="p">[</span><span class="s2">"agent"</span><span class="p">]</span>
- <span class="n">sub_agent_output</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">call_subroutine</span><span class="p">(</span><span class="n">agent_name</span><span class="p">,</span> <span class="n">sub_action</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">_env</span><span class="p">)</span>
- <span class="n">observation</span> <span class="o">=</span> <span class="n">sub_agent_output</span>
- <span class="k">assert</span> <span class="nb">isinstance</span><span class="p">(</span><span class="n">observation</span><span class="p">,</span> <span class="nb">str</span><span class="p">)</span> <span class="ow">or</span> <span class="n">observation</span> <span class="ow">is</span> <span class="kc">None</span>
- <span class="n">done</span> <span class="o">=</span> <span class="kc">False</span>
- <span class="k">return</span> <span class="n">observation</span><span class="p">,</span> <span class="n">done</span>
- <span class="k">def</span> <span class="nf">_run_step</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">observation</span><span class="p">:</span> <span class="nb">str</span> <span class="o">|</span> <span class="kc">None</span><span class="p">)</span> <span class="o">-></span> <span class="nb">tuple</span><span class="p">[</span><span class="nb">str</span> <span class="o">|</span> <span class="kc">None</span><span class="p">,</span> <span class="nb">bool</span><span class="p">]:</span>
- <span class="w"> </span><span class="sd">"""Run a step of the agent (forward, execute, and save).</span>
- <span class="sd"> Returns:</span>
- <span class="sd"> observation: Observation</span>
- <span class="sd"> done: Whether `submit` or another exit reason was called</span>
- <span class="sd"> """</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="c1"># mypy</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">_env</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span>
- <span class="k">for</span> <span class="n">hook</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">hooks</span><span class="p">:</span>
- <span class="n">hook</span><span class="o">.</span><span class="n">on_step_start</span><span class="p">()</span>
- <span class="c1"># fixme: This will probably fail if the state command is not set</span>
- <span class="n">state</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">_env</span><span class="o">.</span><span class="n">communicate</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">state_command</span><span class="p">)</span> <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">state_command</span> <span class="k">else</span> <span class="kc">None</span>
- <span class="n">thought</span><span class="p">,</span> <span class="n">action</span><span class="p">,</span> <span class="n">output</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">forward</span><span class="p">(</span><span class="n">observation</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">_env</span><span class="o">.</span><span class="n">get_available_actions</span><span class="p">(),</span> <span class="n">state</span><span class="p">)</span>
- <span class="k">for</span> <span class="n">hook</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">hooks</span><span class="p">:</span>
- <span class="n">hook</span><span class="o">.</span><span class="n">on_actions_generated</span><span class="p">(</span><span class="n">thought</span><span class="o">=</span><span class="n">thought</span><span class="p">,</span> <span class="n">action</span><span class="o">=</span><span class="n">action</span><span class="p">,</span> <span class="n">output</span><span class="o">=</span><span class="n">output</span><span class="p">)</span>
- <span class="n">run_action</span><span class="p">:</span> <span class="nb">str</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">_guard_multiline_input</span><span class="p">(</span><span class="n">action</span><span class="p">)</span>
- <span class="c1"># Loop over sub-actions (if any)</span>
- <span class="n">done</span> <span class="o">=</span> <span class="kc">False</span>
- <span class="n">observations</span><span class="p">:</span> <span class="nb">list</span><span class="p">[</span><span class="nb">str</span> <span class="o">|</span> <span class="kc">None</span><span class="p">]</span> <span class="o">=</span> <span class="nb">list</span><span class="p">()</span>
- <span class="n">execution_t0</span> <span class="o">=</span> <span class="n">time</span><span class="o">.</span><span class="n">perf_counter</span><span class="p">()</span>
- <span class="k">for</span> <span class="n">sub_action</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">split_actions</span><span class="p">(</span><span class="n">run_action</span><span class="p">):</span>
- <span class="n">observation</span><span class="p">,</span> <span class="n">done</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">_run_sub_action</span><span class="p">(</span><span class="n">sub_action</span><span class="p">)</span>
- <span class="c1"># If the last sub-action is done, the observation is not</span>
- <span class="c1"># appended.</span>
- <span class="k">if</span> <span class="n">done</span><span class="p">:</span>
- <span class="k">break</span>
- <span class="n">observations</span><span class="o">.</span><span class="n">append</span><span class="p">(</span><span class="n">observation</span><span class="p">)</span>
- <span class="n">observation</span> <span class="o">=</span> <span class="s2">"</span><span class="se">\n</span><span class="s2">"</span><span class="o">.</span><span class="n">join</span><span class="p">([</span><span class="n">obs</span> <span class="k">for</span> <span class="n">obs</span> <span class="ow">in</span> <span class="n">observations</span> <span class="k">if</span> <span class="n">obs</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span><span class="p">])</span>
- <span class="n">execution_time</span> <span class="o">=</span> <span class="n">time</span><span class="o">.</span><span class="n">perf_counter</span><span class="p">()</span> <span class="o">-</span> <span class="n">execution_t0</span>
- <span class="n">trajectory_step</span> <span class="o">=</span> <span class="n">TrajectoryStep</span><span class="p">(</span>
- <span class="p">{</span>
- <span class="s2">"action"</span><span class="p">:</span> <span class="n">action</span><span class="p">,</span>
- <span class="s2">"observation"</span><span class="p">:</span> <span class="n">observation</span><span class="p">,</span>
- <span class="s2">"response"</span><span class="p">:</span> <span class="n">output</span><span class="p">,</span>
- <span class="s2">"state"</span><span class="p">:</span> <span class="n">state</span><span class="p">,</span>
- <span class="s2">"thought"</span><span class="p">:</span> <span class="n">thought</span><span class="p">,</span>
- <span class="s2">"execution_time"</span><span class="p">:</span> <span class="n">execution_time</span><span class="p">,</span>
- <span class="p">},</span>
- <span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">trajectory</span><span class="o">.</span><span class="n">append</span><span class="p">(</span><span class="n">trajectory_step</span><span class="p">)</span>
- <span class="n">model_stats</span><span class="p">:</span> <span class="n">APIStats</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">stats</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">info</span><span class="p">[</span><span class="s2">"model_stats"</span><span class="p">]</span> <span class="o">=</span> <span class="n">model_stats</span><span class="o">.</span><span class="n">to_dict</span><span class="p">()</span>
- <span class="k">for</span> <span class="n">hook</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">hooks</span><span class="p">:</span>
- <span class="n">hook</span><span class="o">.</span><span class="n">on_step_done</span><span class="p">(</span><span class="n">trajectory_step</span><span class="o">=</span><span class="n">trajectory_step</span><span class="p">,</span> <span class="n">model_stats</span><span class="o">=</span><span class="n">model_stats</span><span class="p">)</span>
- <span class="k">return</span> <span class="n">observation</span><span class="p">,</span> <span class="n">done</span>
- <span class="k">def</span> <span class="nf">run</span><span class="p">(</span>
- <span class="bp">self</span><span class="p">,</span>
- <span class="n">setup_args</span><span class="p">:</span> <span class="nb">dict</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="n">Any</span><span class="p">],</span>
- <span class="n">env</span><span class="p">:</span> <span class="n">SWEEnv</span><span class="p">,</span>
- <span class="n">observation</span><span class="p">:</span> <span class="nb">str</span> <span class="o">|</span> <span class="kc">None</span> <span class="o">=</span> <span class="kc">None</span><span class="p">,</span>
- <span class="n">traj_dir</span><span class="p">:</span> <span class="n">Path</span> <span class="o">|</span> <span class="kc">None</span> <span class="o">=</span> <span class="kc">None</span><span class="p">,</span>
- <span class="n">return_type</span><span class="p">:</span> <span class="nb">str</span> <span class="o">=</span> <span class="s2">"info_trajectory"</span><span class="p">,</span>
- <span class="n">init_model_stats</span><span class="p">:</span> <span class="n">APIStats</span> <span class="o">|</span> <span class="kc">None</span> <span class="o">=</span> <span class="kc">None</span><span class="p">,</span>
- <span class="p">):</span>
- <span class="w"> </span><span class="sd">"""</span>
- <span class="sd"> Run the agent on an environment.</span>
- <span class="sd"> Return the final value of the specified return type.</span>
- <span class="sd"> Args:</span>
- <span class="sd"> setup_args: Arguments to pass to the agent's setup method.</span>
- <span class="sd"> env: The environment to run the agent on.</span>
- <span class="sd"> observation: Output from environment setup</span>
- <span class="sd"> traj_dir: Directory to save the trajectory to</span>
- <span class="sd"> return_type: Controls what to return.</span>
- <span class="sd"> This should be left at `info_trajectory`, the</span>
- <span class="sd"> other values are for internal usage with subroutines.</span>
- <span class="sd"> init_model_stats: Initial model stats to use for the run.</span>
- <span class="sd"> Returns:</span>
- <span class="sd"> If return_type is "info_trajectory", returns a tuple of</span>
- <span class="sd"> the info dictionary and the trajectory (list of dictionaries).</span>
- <span class="sd"> """</span>
- <span class="k">assert</span> <span class="n">env</span><span class="o">.</span><span class="n">record</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span>
- <span class="k">assert</span> <span class="n">env</span><span class="o">.</span><span class="n">container_obj</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span>
- <span class="k">if</span> <span class="n">env</span><span class="o">.</span><span class="n">container_obj</span><span class="o">.</span><span class="n">id</span> <span class="o">!=</span> <span class="bp">self</span><span class="o">.</span><span class="n">last_container_id</span><span class="p">:</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">info</span><span class="p">(</span><span class="sa">f</span><span class="s2">"Initializing agent settings for container </span><span class="si">{</span><span class="n">env</span><span class="o">.</span><span class="n">container_obj</span><span class="o">.</span><span class="n">id</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">init_environment_vars</span><span class="p">(</span><span class="n">env</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">last_container_id</span> <span class="o">=</span> <span class="n">env</span><span class="o">.</span><span class="n">container_obj</span><span class="o">.</span><span class="n">id</span>
- <span class="c1"># Re-initialize primary</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">setup</span><span class="p">(</span><span class="n">setup_args</span><span class="p">,</span> <span class="n">init_model_stats</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">summarizer_config</span><span class="o">.</span><span class="n">function</span><span class="o">.</span><span class="n">setup</span><span class="p">(</span><span class="n">setup_args</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="p">)</span>
- <span class="c1"># Save/reset some attributes</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">trajectory</span> <span class="o">=</span> <span class="n">Trajectory</span><span class="p">()</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_env</span> <span class="o">=</span> <span class="n">env</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">info</span> <span class="o">=</span> <span class="n">AgentInfo</span><span class="p">()</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">traj_dir</span> <span class="o">=</span> <span class="n">traj_dir</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">info</span><span class="p">(</span><span class="s2">"Trajectory will be saved to </span><span class="si">%s</span><span class="s2">"</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">traj_path</span><span class="p">)</span>
- <span class="c1"># Run action/observation loop</span>
- <span class="k">for</span> <span class="n">hook</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">hooks</span><span class="p">:</span>
- <span class="n">hook</span><span class="o">.</span><span class="n">on_run_start</span><span class="p">()</span>
- <span class="n">done</span> <span class="o">=</span> <span class="kc">False</span>
- <span class="k">while</span> <span class="ow">not</span> <span class="n">done</span><span class="p">:</span>
- <span class="n">observation</span><span class="p">,</span> <span class="n">done</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">_run_step</span><span class="p">(</span><span class="n">observation</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">save_trajectory</span><span class="p">()</span>
- <span class="k">if</span> <span class="n">done</span><span class="p">:</span>
- <span class="n">done</span> <span class="o">=</span> <span class="kc">True</span>
- <span class="k">for</span> <span class="n">hook</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">hooks</span><span class="p">:</span>
- <span class="n">hook</span><span class="o">.</span><span class="n">on_run_done</span><span class="p">(</span><span class="n">trajectory</span><span class="o">=</span><span class="bp">self</span><span class="o">.</span><span class="n">trajectory</span><span class="p">,</span> <span class="n">info</span><span class="o">=</span><span class="bp">self</span><span class="o">.</span><span class="n">info</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">info</span><span class="p">(</span><span class="s2">"Trajectory saved to </span><span class="si">%s</span><span class="s2">"</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">traj_path</span><span class="p">)</span>
- <span class="k">if</span> <span class="n">return_type</span> <span class="o">==</span> <span class="s2">"info"</span><span class="p">:</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">info</span>
- <span class="k">if</span> <span class="n">return_type</span> <span class="o">==</span> <span class="s2">"info_trajectory"</span><span class="p">:</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">info</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">trajectory</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">trajectory</span><span class="p">[</span><span class="o">-</span><span class="mi">1</span><span class="p">][</span><span class="n">return_type</span><span class="p">]</span>
- </code></pre></div></td></tr></table></div>
- </details>
- <div class="doc doc-children">
- <div class="doc doc-object doc-attribute">
- <h3 id="sweagent.agent.agents.Agent.history" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">history</span><span class="p">:</span> <span class="n">History</span></code>
- <span class="doc doc-labels">
- <small class="doc doc-label doc-label-property"><code>property</code></small>
- <small class="doc doc-label doc-label-writable"><code>writable</code></small>
- </span>
- </h3>
- <div class="doc doc-contents ">
- <p>History that is passed on to the model.
- Use <code>_append_history</code> to modify.</p>
- </div>
- </div>
- <div class="doc doc-object doc-attribute">
- <h3 id="sweagent.agent.agents.Agent.info" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">info</span><span class="p">:</span> <span class="n">AgentInfo</span></code>
- <span class="doc doc-labels">
- <small class="doc doc-label doc-label-property"><code>property</code></small>
- <small class="doc doc-label doc-label-writable"><code>writable</code></small>
- </span>
- </h3>
- <div class="doc doc-contents ">
- <p>Information about the agent's run</p>
- </div>
- </div>
- <div class="doc doc-object doc-attribute">
- <h3 id="sweagent.agent.agents.Agent.local_history" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">local_history</span><span class="p">:</span> <span class="nb">list</span><span class="p">[</span><span class="nb">dict</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="nb">str</span><span class="p">]]</span></code>
- <span class="doc doc-labels">
- <small class="doc doc-label doc-label-property"><code>property</code></small>
- </span>
- </h3>
- <div class="doc doc-contents ">
- <p>Return the history of the agent since the last reset.</p>
- </div>
- </div>
- <div class="doc doc-object doc-attribute">
- <h3 id="sweagent.agent.agents.Agent.state_command" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">state_command</span><span class="p">:</span> <span class="nb">str</span></code>
- <span class="doc doc-labels">
- <small class="doc doc-label doc-label-property"><code>property</code></small>
- </span>
- </h3>
- <div class="doc doc-contents ">
- <p>Return the bash command that will be used to extract the environment state.</p>
- </div>
- </div>
- <div class="doc doc-object doc-attribute">
- <h3 id="sweagent.agent.agents.Agent.traj_path" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">traj_path</span><span class="p">:</span> <span class="n">Path</span> <span class="o">|</span> <span class="kc">None</span></code>
- <span class="doc doc-labels">
- <small class="doc doc-label doc-label-property"><code>property</code></small>
- </span>
- </h3>
- <div class="doc doc-contents ">
- <p>Returns path to the trajectory.
- The path is reset for every new instance.</p>
- </div>
- </div>
- <div class="doc doc-object doc-attribute">
- <h3 id="sweagent.agent.agents.Agent.trajectory" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">trajectory</span><span class="p">:</span> <span class="n">Trajectory</span></code>
- <span class="doc doc-labels">
- <small class="doc doc-label doc-label-property"><code>property</code></small>
- <small class="doc doc-label doc-label-writable"><code>writable</code></small>
- </span>
- </h3>
- <div class="doc doc-contents ">
- <p>Trajectory of the agent for the current instance. In contrast to <code>history</code>,
- this is mostly for the informational value of how the agent interacted with
- the environment and is also what is being used when replaying the trajectory</p>
- </div>
- </div>
- <div class="doc doc-object doc-function">
- <h3 id="sweagent.agent.agents.Agent.add_hook" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">add_hook</span><span class="p">(</span><span class="n">hook</span><span class="p">)</span></code>
- </h3>
- <div class="doc doc-contents ">
- <p>Add hook to agent</p>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">347</span>
- <span class="normal">348</span>
- <span class="normal">349</span>
- <span class="normal">350</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">def</span> <span class="nf">add_hook</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">hook</span><span class="p">:</span> <span class="n">AgentHook</span><span class="p">)</span> <span class="o">-></span> <span class="kc">None</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Add hook to agent"""</span>
- <span class="n">hook</span><span class="o">.</span><span class="n">on_init</span><span class="p">(</span><span class="n">agent</span><span class="o">=</span><span class="bp">self</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">hooks</span><span class="o">.</span><span class="n">append</span><span class="p">(</span><span class="n">hook</span><span class="p">)</span>
- </code></pre></div></td></tr></table></div>
- </details>
- </div>
- </div>
- <div class="doc doc-object doc-function">
- <h3 id="sweagent.agent.agents.Agent.call_subroutine" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">call_subroutine</span><span class="p">(</span><span class="n">agent_name</span><span class="p">,</span> <span class="n">sub_action</span><span class="p">,</span> <span class="n">env</span><span class="p">)</span></code>
- </h3>
- <div class="doc doc-contents ">
- <p>Call subroutine</p>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">890</span>
- <span class="normal">891</span>
- <span class="normal">892</span>
- <span class="normal">893</span>
- <span class="normal">894</span>
- <span class="normal">895</span>
- <span class="normal">896</span>
- <span class="normal">897</span>
- <span class="normal">898</span>
- <span class="normal">899</span>
- <span class="normal">900</span>
- <span class="normal">901</span>
- <span class="normal">902</span>
- <span class="normal">903</span>
- <span class="normal">904</span>
- <span class="normal">905</span>
- <span class="normal">906</span>
- <span class="normal">907</span>
- <span class="normal">908</span>
- <span class="normal">909</span>
- <span class="normal">910</span>
- <span class="normal">911</span>
- <span class="normal">912</span>
- <span class="normal">913</span>
- <span class="normal">914</span>
- <span class="normal">915</span>
- <span class="normal">916</span>
- <span class="normal">917</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">def</span> <span class="nf">call_subroutine</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">agent_name</span><span class="p">:</span> <span class="nb">str</span><span class="p">,</span> <span class="n">sub_action</span><span class="p">:</span> <span class="n">SubAction</span><span class="p">,</span> <span class="n">env</span><span class="p">:</span> <span class="n">SWEEnv</span><span class="p">):</span>
- <span class="w"> </span><span class="sd">"""Call subroutine"""</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="c1"># mypy</span>
- <span class="n">env_vars</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">get_environment_vars</span><span class="p">(</span><span class="n">env</span><span class="p">)</span>
- <span class="n">cwd</span> <span class="o">=</span> <span class="n">env</span><span class="o">.</span><span class="n">communicate</span><span class="p">(</span><span class="s2">"pwd -P"</span><span class="p">)</span><span class="o">.</span><span class="n">strip</span><span class="p">()</span>
- <span class="n">init_observation</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">_subroutines</span><span class="p">[</span><span class="n">agent_name</span><span class="p">]</span><span class="o">.</span><span class="n">init_observation</span>
- <span class="k">if</span> <span class="n">init_observation</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span><span class="p">:</span>
- <span class="n">obs</span><span class="p">,</span> <span class="n">_</span><span class="p">,</span> <span class="n">_</span><span class="p">,</span> <span class="n">_</span> <span class="o">=</span> <span class="n">env</span><span class="o">.</span><span class="n">step</span><span class="p">(</span><span class="n">init_observation</span><span class="o">.</span><span class="n">format</span><span class="p">(</span><span class="n">args</span><span class="o">=</span><span class="n">sub_action</span><span class="p">[</span><span class="s2">"args"</span><span class="p">]))</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="n">obs</span> <span class="o">=</span> <span class="kc">None</span>
- <span class="k">if</span> <span class="n">env</span><span class="o">.</span><span class="n">returncode</span> <span class="o">!=</span> <span class="mi">0</span><span class="p">:</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_append_history</span><span class="p">(</span><span class="n">HistoryItem</span><span class="p">({</span><span class="s2">"role"</span><span class="p">:</span> <span class="s2">"user"</span><span class="p">,</span> <span class="s2">"content"</span><span class="p">:</span> <span class="n">obs</span><span class="p">,</span> <span class="s2">"agent"</span><span class="p">:</span> <span class="n">agent_name</span><span class="p">}))</span>
- <span class="n">msg</span> <span class="o">=</span> <span class="sa">f</span><span class="s2">"Nonzero return code: </span><span class="si">{</span><span class="n">env</span><span class="o">.</span><span class="n">returncode</span><span class="si">}</span><span class="s2"> for init_observation in </span><span class="si">{</span><span class="n">agent_name</span><span class="si">}</span><span class="s2">.</span><span class="se">\n</span><span class="si">{</span><span class="n">obs</span><span class="si">}</span><span class="s2">"</span>
- <span class="k">raise</span> <span class="ne">RuntimeError</span><span class="p">(</span><span class="n">msg</span><span class="p">)</span>
- <span class="n">return_type</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">_subroutines</span><span class="p">[</span><span class="n">agent_name</span><span class="p">]</span><span class="o">.</span><span class="n">return_type</span>
- <span class="n">sub_agent</span> <span class="o">=</span> <span class="n">Agent</span><span class="p">(</span><span class="n">agent_name</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">_subroutines</span><span class="p">[</span><span class="n">agent_name</span><span class="p">]</span><span class="o">.</span><span class="n">agent_args</span><span class="p">)</span>
- <span class="n">sub_agent_output</span> <span class="o">=</span> <span class="n">sub_agent</span><span class="o">.</span><span class="n">run</span><span class="p">(</span>
- <span class="p">{</span><span class="s2">"issue"</span><span class="p">:</span> <span class="n">sub_action</span><span class="p">[</span><span class="s2">"args"</span><span class="p">]},</span>
- <span class="n">env</span><span class="p">,</span>
- <span class="n">observation</span><span class="o">=</span><span class="n">obs</span><span class="p">,</span>
- <span class="n">return_type</span><span class="o">=</span><span class="n">return_type</span><span class="p">,</span>
- <span class="n">init_model_stats</span><span class="o">=</span><span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">stats</span><span class="p">,</span>
- <span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">history</span> <span class="o">+=</span> <span class="n">sub_agent</span><span class="o">.</span><span class="n">history</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">set_environment_vars</span><span class="p">(</span><span class="n">env</span><span class="p">,</span> <span class="n">env_vars</span><span class="p">)</span>
- <span class="n">env</span><span class="o">.</span><span class="n">communicate</span><span class="p">(</span><span class="sa">f</span><span class="s2">"cd </span><span class="si">{</span><span class="n">cwd</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">stats</span><span class="o">.</span><span class="n">replace</span><span class="p">(</span><span class="n">sub_agent</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">stats</span><span class="p">)</span>
- <span class="k">return</span> <span class="n">sub_agent_output</span>
- </code></pre></div></td></tr></table></div>
- </details>
- </div>
- </div>
- <div class="doc doc-object doc-function">
- <h3 id="sweagent.agent.agents.Agent.check_format_and_requery" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">check_format_and_requery</span><span class="p">(</span><span class="n">output</span><span class="p">)</span></code>
- </h3>
- <div class="doc doc-contents ">
- <p>Query the model with the current state and observation with the appropriate template.</p>
- <p>Try to parse the output into a thought and action. Retry if the output is malformatted or the action is blocked.</p>
- <p><span class="doc-section-title">Returns:</span></p>
- <table>
- <thead>
- <tr>
- <th>Name</th> <th>Type</th>
- <th>Description</th>
- </tr>
- </thead>
- <tbody>
- <tr class="doc-section-item">
- <td><code>thought</code></td> <td>
- <code>str</code>
- </td>
- <td>
- <div class="doc-md-description">
- <p>model reasoning</p>
- </div>
- </td>
- </tr>
- <tr class="doc-section-item">
- <td><code>action</code></td> <td>
- <code>str</code>
- </td>
- <td>
- <div class="doc-md-description">
- <p>action that the model proposes</p>
- </div>
- </td>
- </tr>
- <tr class="doc-section-item">
- <td><code>output</code></td> <td>
- <code>str</code>
- </td>
- <td>
- <div class="doc-md-description">
- <p>raw model output</p>
- </div>
- </td>
- </tr>
- </tbody>
- </table>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">744</span>
- <span class="normal">745</span>
- <span class="normal">746</span>
- <span class="normal">747</span>
- <span class="normal">748</span>
- <span class="normal">749</span>
- <span class="normal">750</span>
- <span class="normal">751</span>
- <span class="normal">752</span>
- <span class="normal">753</span>
- <span class="normal">754</span>
- <span class="normal">755</span>
- <span class="normal">756</span>
- <span class="normal">757</span>
- <span class="normal">758</span>
- <span class="normal">759</span>
- <span class="normal">760</span>
- <span class="normal">761</span>
- <span class="normal">762</span>
- <span class="normal">763</span>
- <span class="normal">764</span>
- <span class="normal">765</span>
- <span class="normal">766</span>
- <span class="normal">767</span>
- <span class="normal">768</span>
- <span class="normal">769</span>
- <span class="normal">770</span>
- <span class="normal">771</span>
- <span class="normal">772</span>
- <span class="normal">773</span>
- <span class="normal">774</span>
- <span class="normal">775</span>
- <span class="normal">776</span>
- <span class="normal">777</span>
- <span class="normal">778</span>
- <span class="normal">779</span>
- <span class="normal">780</span>
- <span class="normal">781</span>
- <span class="normal">782</span>
- <span class="normal">783</span>
- <span class="normal">784</span>
- <span class="normal">785</span>
- <span class="normal">786</span>
- <span class="normal">787</span>
- <span class="normal">788</span>
- <span class="normal">789</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">def</span> <span class="nf">check_format_and_requery</span><span class="p">(</span>
- <span class="bp">self</span><span class="p">,</span>
- <span class="n">output</span><span class="p">:</span> <span class="nb">str</span><span class="p">,</span>
- <span class="p">)</span> <span class="o">-></span> <span class="nb">tuple</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="nb">str</span><span class="p">,</span> <span class="nb">str</span><span class="p">]:</span>
- <span class="w"> </span><span class="sd">"""Query the model with the current state and observation with the appropriate template.</span>
- <span class="sd"> Try to parse the output into a thought and action. Retry if the output is malformatted or the action is blocked.</span>
- <span class="sd"> Returns:</span>
- <span class="sd"> thought: model reasoning</span>
- <span class="sd"> action: action that the model proposes</span>
- <span class="sd"> output: raw model output</span>
- <span class="sd"> """</span>
- <span class="c1"># Condition for handling outputs with no thought (just action)</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">args</span><span class="o">.</span><span class="n">model_name</span> <span class="o">==</span> <span class="s2">"human"</span><span class="p">:</span>
- <span class="k">return</span> <span class="s2">""</span><span class="p">,</span> <span class="n">output</span><span class="p">,</span> <span class="n">output</span>
- <span class="k">elif</span> <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">args</span><span class="o">.</span><span class="n">model_name</span> <span class="o">==</span> <span class="s2">"human_thought"</span><span class="p">:</span>
- <span class="n">thought</span><span class="p">,</span> <span class="n">action</span> <span class="o">=</span> <span class="n">ParseFunction</span><span class="o">.</span><span class="n">get</span><span class="p">(</span><span class="s2">"ThoughtActionParser"</span><span class="p">)(</span>
- <span class="n">output</span><span class="p">,</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">_commands</span> <span class="o">+</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">subroutine_types</span><span class="p">,</span>
- <span class="n">strict</span><span class="o">=</span><span class="kc">False</span><span class="p">,</span>
- <span class="p">)</span>
- <span class="k">return</span> <span class="n">thought</span><span class="p">,</span> <span class="n">action</span><span class="p">,</span> <span class="n">output</span>
- <span class="n">format_fails</span> <span class="o">=</span> <span class="n">blocklist_fails</span> <span class="o">=</span> <span class="mi">0</span>
- <span class="k">while</span> <span class="n">format_fails</span> <span class="o">+</span> <span class="n">blocklist_fails</span> <span class="o"><=</span> <span class="mi">2</span><span class="p">:</span>
- <span class="k">try</span><span class="p">:</span>
- <span class="n">thought</span><span class="p">,</span> <span class="n">action</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">parse_function</span><span class="p">(</span>
- <span class="n">output</span><span class="p">,</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">_commands</span> <span class="o">+</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">subroutine_types</span><span class="p">,</span>
- <span class="n">strict</span><span class="o">=</span><span class="kc">False</span><span class="p">,</span>
- <span class="p">)</span>
- <span class="k">except</span> <span class="ne">KeyboardInterrupt</span><span class="p">:</span>
- <span class="k">raise</span>
- <span class="k">except</span> <span class="n">FormatError</span><span class="p">:</span>
- <span class="n">format_fails</span> <span class="o">+=</span> <span class="mi">1</span>
- <span class="n">output</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">retry_after_format_fail</span><span class="p">(</span><span class="n">output</span><span class="p">)</span>
- <span class="k">continue</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">should_block_action</span><span class="p">(</span><span class="n">action</span><span class="p">):</span>
- <span class="n">blocklist_fails</span> <span class="o">+=</span> <span class="mi">1</span>
- <span class="n">output</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">retry_after_blocklist_fail</span><span class="p">(</span><span class="n">output</span><span class="p">,</span> <span class="n">action</span><span class="p">)</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="k">return</span> <span class="n">thought</span><span class="p">,</span> <span class="n">action</span><span class="p">,</span> <span class="n">output</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="sa">f</span><span class="s2">"Malformat limit reached: </span><span class="se">\n</span><span class="si">{</span><span class="n">output</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="k">return</span> <span class="s2">"Exit due to format error"</span><span class="p">,</span> <span class="s2">"exit_format"</span><span class="p">,</span> <span class="n">output</span>
- </code></pre></div></td></tr></table></div>
- </details>
- </div>
- </div>
- <div class="doc doc-object doc-function">
- <h3 id="sweagent.agent.agents.Agent.forward" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">forward</span><span class="p">(</span><span class="n">observation</span><span class="p">,</span> <span class="n">available_actions</span><span class="p">,</span> <span class="n">state</span><span class="p">)</span></code>
- </h3>
- <div class="doc doc-contents ">
- <p>Forwards the model</p>
- <p><span class="doc-section-title">Parameters:</span></p>
- <table>
- <thead>
- <tr>
- <th>Name</th>
- <th>Type</th>
- <th>Description</th>
- <th>Default</th>
- </tr>
- </thead>
- <tbody>
- <tr class="doc-section-item">
- <td><code>observation</code></td>
- <td>
- <code>str | None</code>
- </td>
- <td>
- <div class="doc-md-description">
- <p>Observation</p>
- </div>
- </td>
- <td>
- <em>required</em>
- </td>
- </tr>
- <tr class="doc-section-item">
- <td><code>available_actions</code></td>
- <td>
- <code>list[str]</code>
- </td>
- <td>
- <div class="doc-md-description">
- <p>Currently not used</p>
- </div>
- </td>
- <td>
- <em>required</em>
- </td>
- </tr>
- <tr class="doc-section-item">
- <td><code>state</code></td>
- <td>
- <code>str</code>
- </td>
- <td>
- <div class="doc-md-description">
-
- </div>
- </td>
- <td>
- <em>required</em>
- </td>
- </tr>
- </tbody>
- </table>
- <p><span class="doc-section-title">Returns:</span></p>
- <table>
- <thead>
- <tr>
- <th>Name</th> <th>Type</th>
- <th>Description</th>
- </tr>
- </thead>
- <tbody>
- <tr class="doc-section-item">
- <td><code>thought</code></td> <td>
- <code>str</code>
- </td>
- <td>
- <div class="doc-md-description">
- <p>model reasoning</p>
- </div>
- </td>
- </tr>
- <tr class="doc-section-item">
- <td><code>action</code></td> <td>
- <code>str</code>
- </td>
- <td>
- <div class="doc-md-description">
- <p>action that the model proposes</p>
- </div>
- </td>
- </tr>
- <tr class="doc-section-item">
- <td><code>output</code></td> <td>
- <code>str</code>
- </td>
- <td>
- <div class="doc-md-description">
- <p>raw model output (not output of the action)</p>
- </div>
- </td>
- </tr>
- </tbody>
- </table>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">624</span>
- <span class="normal">625</span>
- <span class="normal">626</span>
- <span class="normal">627</span>
- <span class="normal">628</span>
- <span class="normal">629</span>
- <span class="normal">630</span>
- <span class="normal">631</span>
- <span class="normal">632</span>
- <span class="normal">633</span>
- <span class="normal">634</span>
- <span class="normal">635</span>
- <span class="normal">636</span>
- <span class="normal">637</span>
- <span class="normal">638</span>
- <span class="normal">639</span>
- <span class="normal">640</span>
- <span class="normal">641</span>
- <span class="normal">642</span>
- <span class="normal">643</span>
- <span class="normal">644</span>
- <span class="normal">645</span>
- <span class="normal">646</span>
- <span class="normal">647</span>
- <span class="normal">648</span>
- <span class="normal">649</span>
- <span class="normal">650</span>
- <span class="normal">651</span>
- <span class="normal">652</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">def</span> <span class="nf">forward</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">observation</span><span class="p">:</span> <span class="nb">str</span> <span class="o">|</span> <span class="kc">None</span><span class="p">,</span> <span class="n">available_actions</span><span class="p">:</span> <span class="nb">list</span><span class="p">[</span><span class="nb">str</span><span class="p">],</span> <span class="n">state</span><span class="p">:</span> <span class="nb">str</span><span class="p">)</span> <span class="o">-></span> <span class="nb">tuple</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="nb">str</span><span class="p">,</span> <span class="nb">str</span><span class="p">]:</span>
- <span class="w"> </span><span class="sd">"""Forwards the model</span>
- <span class="sd"> Args:</span>
- <span class="sd"> observation: Observation</span>
- <span class="sd"> available_actions: Currently not used</span>
- <span class="sd"> state:</span>
- <span class="sd"> Returns:</span>
- <span class="sd"> thought: model reasoning</span>
- <span class="sd"> action: action that the model proposes</span>
- <span class="sd"> output: raw model output (not output of the action)</span>
- <span class="sd"> """</span>
- <span class="n">thought</span><span class="p">,</span> <span class="n">action</span><span class="p">,</span> <span class="n">output</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">forward_with_error_check</span><span class="p">(</span><span class="n">observation</span><span class="p">,</span> <span class="n">state</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_append_history</span><span class="p">(</span>
- <span class="p">{</span>
- <span class="s2">"role"</span><span class="p">:</span> <span class="s2">"assistant"</span><span class="p">,</span>
- <span class="s2">"content"</span><span class="p">:</span> <span class="n">output</span><span class="p">,</span>
- <span class="s2">"thought"</span><span class="p">:</span> <span class="n">thought</span><span class="p">,</span>
- <span class="s2">"action"</span><span class="p">:</span> <span class="n">action</span><span class="p">,</span>
- <span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">,</span>
- <span class="p">},</span>
- <span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">info</span><span class="p">(</span><span class="sa">f</span><span class="s2">"💭 THOUGHT (</span><span class="si">{</span><span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="si">}</span><span class="s2">)</span><span class="se">\n</span><span class="si">{</span><span class="n">thought</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">info</span><span class="p">(</span><span class="sa">f</span><span class="s2">"🎬 ACTION (</span><span class="si">{</span><span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="si">}</span><span class="s2">)</span><span class="se">\n</span><span class="si">{</span><span class="n">action</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="k">return</span> <span class="n">thought</span><span class="p">,</span> <span class="n">action</span><span class="p">,</span> <span class="n">output</span>
- </code></pre></div></td></tr></table></div>
- </details>
- </div>
- </div>
- <div class="doc doc-object doc-function">
- <h3 id="sweagent.agent.agents.Agent.forward_model" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">forward_model</span><span class="p">(</span><span class="n">observation</span><span class="p">,</span> <span class="n">state</span><span class="p">)</span></code>
- </h3>
- <div class="doc doc-contents ">
- <p>Query the model with the current state and observation with the appropriate template.</p>
- <p><span class="doc-section-title">Returns:</span></p>
- <table>
- <thead>
- <tr>
- <th>Name</th> <th>Type</th>
- <th>Description</th>
- </tr>
- </thead>
- <tbody>
- <tr class="doc-section-item">
- <td><code>output</code></td> <td>
- <code>str</code>
- </td>
- <td>
- <div class="doc-md-description">
- <p>raw model output (not output of the command)</p>
- </div>
- </td>
- </tr>
- </tbody>
- </table>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">654</span>
- <span class="normal">655</span>
- <span class="normal">656</span>
- <span class="normal">657</span>
- <span class="normal">658</span>
- <span class="normal">659</span>
- <span class="normal">660</span>
- <span class="normal">661</span>
- <span class="normal">662</span>
- <span class="normal">663</span>
- <span class="normal">664</span>
- <span class="normal">665</span>
- <span class="normal">666</span>
- <span class="normal">667</span>
- <span class="normal">668</span>
- <span class="normal">669</span>
- <span class="normal">670</span>
- <span class="normal">671</span>
- <span class="normal">672</span>
- <span class="normal">673</span>
- <span class="normal">674</span>
- <span class="normal">675</span>
- <span class="normal">676</span>
- <span class="normal">677</span>
- <span class="normal">678</span>
- <span class="normal">679</span>
- <span class="normal">680</span>
- <span class="normal">681</span>
- <span class="normal">682</span>
- <span class="normal">683</span>
- <span class="normal">684</span>
- <span class="normal">685</span>
- <span class="normal">686</span>
- <span class="normal">687</span>
- <span class="normal">688</span>
- <span class="normal">689</span>
- <span class="normal">690</span>
- <span class="normal">691</span>
- <span class="normal">692</span>
- <span class="normal">693</span>
- <span class="normal">694</span>
- <span class="normal">695</span>
- <span class="normal">696</span>
- <span class="normal">697</span>
- <span class="normal">698</span>
- <span class="normal">699</span>
- <span class="normal">700</span>
- <span class="normal">701</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">def</span> <span class="nf">forward_model</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">observation</span><span class="p">:</span> <span class="nb">str</span> <span class="o">|</span> <span class="kc">None</span><span class="p">,</span> <span class="n">state</span><span class="p">:</span> <span class="nb">str</span><span class="p">)</span> <span class="o">-></span> <span class="nb">str</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Query the model with the current state and observation with the appropriate template.</span>
- <span class="sd"> Returns:</span>
- <span class="sd"> output: raw model output (not output of the command)</span>
- <span class="sd"> """</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="c1"># mypy</span>
- <span class="k">try</span><span class="p">:</span>
- <span class="n">state_vars</span> <span class="o">=</span> <span class="n">json</span><span class="o">.</span><span class="n">loads</span><span class="p">(</span><span class="n">state</span><span class="p">)</span>
- <span class="k">except</span> <span class="n">json</span><span class="o">.</span><span class="n">JSONDecodeError</span> <span class="k">as</span> <span class="n">e</span><span class="p">:</span>
- <span class="n">msg</span> <span class="o">=</span> <span class="sa">f</span><span class="s2">"State </span><span class="si">{</span><span class="n">state</span><span class="si">!r}</span><span class="s2"> is not valid json. This is an internal error, please report it."</span>
- <span class="k">raise</span> <span class="ne">ValueError</span><span class="p">(</span><span class="n">msg</span><span class="p">)</span> <span class="kn">from</span> <span class="nn">e</span>
- <span class="n">templates</span><span class="p">:</span> <span class="nb">list</span><span class="p">[</span><span class="nb">str</span><span class="p">]</span> <span class="o">=</span> <span class="p">[]</span>
- <span class="c1"># Determine observation template based on what prior observation was</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">history</span><span class="p">[</span><span class="o">-</span><span class="mi">1</span><span class="p">][</span><span class="s2">"role"</span><span class="p">]</span> <span class="o">==</span> <span class="s2">"system"</span> <span class="ow">or</span> <span class="bp">self</span><span class="o">.</span><span class="n">history</span><span class="p">[</span><span class="o">-</span><span class="mi">1</span><span class="p">]</span><span class="o">.</span><span class="n">get</span><span class="p">(</span><span class="s2">"is_demo"</span><span class="p">,</span> <span class="kc">False</span><span class="p">):</span>
- <span class="c1"># Show instance template if prev. obs. was initial system message</span>
- <span class="n">templates</span> <span class="o">=</span> <span class="p">[</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">instance_template</span><span class="p">]</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">strategy_template</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span><span class="p">:</span>
- <span class="n">templates</span><span class="o">.</span><span class="n">append</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">strategy_template</span><span class="p">)</span>
- <span class="k">elif</span> <span class="n">observation</span> <span class="ow">is</span> <span class="kc">None</span> <span class="ow">or</span> <span class="n">observation</span><span class="o">.</span><span class="n">strip</span><span class="p">()</span> <span class="o">==</span> <span class="s2">""</span><span class="p">:</span>
- <span class="c1"># Show no output template if observation content was empty</span>
- <span class="n">templates</span> <span class="o">=</span> <span class="p">[</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">next_step_no_output_template</span><span class="p">]</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="c1"># Show standard output template if there is observation content</span>
- <span class="n">templates</span> <span class="o">=</span> <span class="p">[</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">next_step_template</span><span class="p">]</span>
- <span class="c1"># Populate selected template(s) with information (e.g., issue, arguments, state)</span>
- <span class="n">messages</span> <span class="o">=</span> <span class="p">[]</span>
- <span class="k">for</span> <span class="n">template</span> <span class="ow">in</span> <span class="n">templates</span><span class="p">:</span>
- <span class="n">messages</span><span class="o">.</span><span class="n">append</span><span class="p">(</span>
- <span class="n">template</span><span class="o">.</span><span class="n">format</span><span class="p">(</span>
- <span class="o">**</span><span class="bp">self</span><span class="o">.</span><span class="n">instance_args</span><span class="p">,</span>
- <span class="o">**</span><span class="bp">self</span><span class="o">.</span><span class="n">system_args</span><span class="p">,</span>
- <span class="o">**</span><span class="n">state_vars</span><span class="p">,</span>
- <span class="n">observation</span><span class="o">=</span><span class="p">(</span><span class="n">observation</span> <span class="k">if</span> <span class="n">observation</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="k">else</span> <span class="s2">""</span><span class="p">),</span>
- <span class="o">**</span><span class="bp">self</span><span class="o">.</span><span class="n">_forwarded_vars</span><span class="p">,</span>
- <span class="p">),</span>
- <span class="p">)</span>
- <span class="n">message</span> <span class="o">=</span> <span class="s2">"</span><span class="se">\n</span><span class="s2">"</span><span class="o">.</span><span class="n">join</span><span class="p">(</span><span class="n">messages</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">info</span><span class="p">(</span><span class="sa">f</span><span class="s2">"🤖 MODEL INPUT</span><span class="se">\n</span><span class="si">{</span><span class="n">message</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_append_history</span><span class="p">({</span><span class="s2">"role"</span><span class="p">:</span> <span class="s2">"user"</span><span class="p">,</span> <span class="s2">"content"</span><span class="p">:</span> <span class="n">message</span><span class="p">,</span> <span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">})</span>
- <span class="k">for</span> <span class="n">hook</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">hooks</span><span class="p">:</span>
- <span class="n">hook</span><span class="o">.</span><span class="n">on_model_query</span><span class="p">(</span><span class="n">query</span><span class="o">=</span><span class="bp">self</span><span class="o">.</span><span class="n">local_history</span><span class="p">,</span> <span class="n">agent</span><span class="o">=</span><span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">)</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">query</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">local_history</span><span class="p">)</span>
- </code></pre></div></td></tr></table></div>
- </details>
- </div>
- </div>
- <div class="doc doc-object doc-function">
- <h3 id="sweagent.agent.agents.Agent.forward_with_error_check" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">forward_with_error_check</span><span class="p">(</span><span class="n">observation</span><span class="p">,</span> <span class="n">state</span><span class="p">)</span></code>
- </h3>
- <div class="doc doc-contents ">
- <p>Wrapper around <code>self.forward_model</code> that handles errors and retries
- due to format errors or blocked actions.</p>
- <p><span class="doc-section-title">Returns:</span></p>
- <table>
- <thead>
- <tr>
- <th>Name</th> <th>Type</th>
- <th>Description</th>
- </tr>
- </thead>
- <tbody>
- <tr class="doc-section-item">
- <td><code>thought</code></td> <td>
- <code>str</code>
- </td>
- <td>
- <div class="doc-md-description">
- <p>model reasoning</p>
- </div>
- </td>
- </tr>
- <tr class="doc-section-item">
- <td><code>action</code></td> <td>
- <code>str</code>
- </td>
- <td>
- <div class="doc-md-description">
- <p>action that the model proposes</p>
- </div>
- </td>
- </tr>
- <tr class="doc-section-item">
- <td><code>output</code></td> <td>
- <code>str</code>
- </td>
- <td>
- <div class="doc-md-description">
- <p>raw model output</p>
- </div>
- </td>
- </tr>
- </tbody>
- </table>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">791</span>
- <span class="normal">792</span>
- <span class="normal">793</span>
- <span class="normal">794</span>
- <span class="normal">795</span>
- <span class="normal">796</span>
- <span class="normal">797</span>
- <span class="normal">798</span>
- <span class="normal">799</span>
- <span class="normal">800</span>
- <span class="normal">801</span>
- <span class="normal">802</span>
- <span class="normal">803</span>
- <span class="normal">804</span>
- <span class="normal">805</span>
- <span class="normal">806</span>
- <span class="normal">807</span>
- <span class="normal">808</span>
- <span class="normal">809</span>
- <span class="normal">810</span>
- <span class="normal">811</span>
- <span class="normal">812</span>
- <span class="normal">813</span>
- <span class="normal">814</span>
- <span class="normal">815</span>
- <span class="normal">816</span>
- <span class="normal">817</span>
- <span class="normal">818</span>
- <span class="normal">819</span>
- <span class="normal">820</span>
- <span class="normal">821</span>
- <span class="normal">822</span>
- <span class="normal">823</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">def</span> <span class="nf">forward_with_error_check</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">observation</span><span class="p">:</span> <span class="nb">str</span> <span class="o">|</span> <span class="kc">None</span><span class="p">,</span> <span class="n">state</span><span class="p">:</span> <span class="nb">str</span><span class="p">)</span> <span class="o">-></span> <span class="nb">tuple</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="nb">str</span><span class="p">,</span> <span class="nb">str</span><span class="p">]:</span>
- <span class="w"> </span><span class="sd">"""Wrapper around `self.forward_model` that handles errors and retries</span>
- <span class="sd"> due to format errors or blocked actions.</span>
- <span class="sd"> Returns:</span>
- <span class="sd"> thought: model reasoning</span>
- <span class="sd"> action: action that the model proposes</span>
- <span class="sd"> output: raw model output</span>
- <span class="sd"> """</span>
- <span class="k">try</span><span class="p">:</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">check_format_and_requery</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">forward_model</span><span class="p">(</span><span class="n">observation</span><span class="p">,</span> <span class="n">state</span><span class="p">))</span>
- <span class="k">except</span> <span class="ne">KeyboardInterrupt</span><span class="p">:</span>
- <span class="k">raise</span>
- <span class="k">except</span> <span class="ne">RuntimeError</span> <span class="k">as</span> <span class="n">e</span><span class="p">:</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="sa">f</span><span class="s2">"Runtime error: </span><span class="si">{</span><span class="n">e</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="k">return</span> <span class="p">(</span>
- <span class="sa">f</span><span class="s2">"Exit due to runtime error: </span><span class="si">{</span><span class="n">e</span><span class="si">}</span><span class="s2">"</span><span class="p">,</span>
- <span class="s2">"exit_error"</span><span class="p">,</span>
- <span class="sa">f</span><span class="s2">"exit due to runtime error: </span><span class="si">{</span><span class="n">e</span><span class="si">}</span><span class="s2">"</span><span class="p">,</span>
- <span class="p">)</span>
- <span class="k">except</span> <span class="n">ContextWindowExceededError</span><span class="p">:</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="s2">"Context window exceeded"</span><span class="p">)</span>
- <span class="k">return</span> <span class="s2">"Exit due to context window"</span><span class="p">,</span> <span class="s2">"exit_context"</span><span class="p">,</span> <span class="s2">"Exit due to context window"</span>
- <span class="k">except</span> <span class="n">CostLimitExceededError</span><span class="p">:</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="s2">"Cost limit exceeded"</span><span class="p">)</span>
- <span class="k">return</span> <span class="s2">"Exit due to cost limit"</span><span class="p">,</span> <span class="s2">"exit_cost"</span><span class="p">,</span> <span class="s2">"Exit due to cost limit"</span>
- <span class="k">except</span> <span class="n">RetryError</span> <span class="k">as</span> <span class="n">e</span><span class="p">:</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="sa">f</span><span class="s2">"Retry error: </span><span class="si">{</span><span class="n">e</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="k">return</span> <span class="p">(</span>
- <span class="sa">f</span><span class="s2">"Exit due to retry error: </span><span class="si">{</span><span class="n">e</span><span class="si">}</span><span class="s2">"</span><span class="p">,</span>
- <span class="s2">"exit_api"</span><span class="p">,</span>
- <span class="sa">f</span><span class="s2">"exit due to retry error: </span><span class="si">{</span><span class="n">e</span><span class="si">}</span><span class="s2">"</span><span class="p">,</span>
- <span class="p">)</span>
- </code></pre></div></td></tr></table></div>
- </details>
- </div>
- </div>
- <div class="doc doc-object doc-function">
- <h3 id="sweagent.agent.agents.Agent.get_environment_vars" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">get_environment_vars</span><span class="p">(</span><span class="n">env</span><span class="p">)</span></code>
- </h3>
- <div class="doc doc-contents ">
- <p>Get environment variables inside of the container</p>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">882</span>
- <span class="normal">883</span>
- <span class="normal">884</span>
- <span class="normal">885</span>
- <span class="normal">886</span>
- <span class="normal">887</span>
- <span class="normal">888</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">def</span> <span class="nf">get_environment_vars</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="p">:</span> <span class="n">SWEEnv</span><span class="p">)</span> <span class="o">-></span> <span class="nb">dict</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="n">Any</span><span class="p">]:</span>
- <span class="w"> </span><span class="sd">"""Get environment variables inside of the container"""</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="c1"># mypy</span>
- <span class="n">env_vars</span> <span class="o">=</span> <span class="nb">dict</span><span class="p">()</span>
- <span class="k">for</span> <span class="n">var</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">env_variables</span><span class="p">:</span>
- <span class="n">env_vars</span><span class="p">[</span><span class="n">var</span><span class="p">]</span> <span class="o">=</span> <span class="n">env</span><span class="o">.</span><span class="n">communicate</span><span class="p">(</span><span class="sa">f</span><span class="s2">"echo $</span><span class="si">{</span><span class="n">var</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span><span class="o">.</span><span class="n">strip</span><span class="p">()</span>
- <span class="k">return</span> <span class="n">env_vars</span>
- </code></pre></div></td></tr></table></div>
- </details>
- </div>
- </div>
- <div class="doc doc-object doc-function">
- <h3 id="sweagent.agent.agents.Agent.retry_after_blocklist_fail" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">retry_after_blocklist_fail</span><span class="p">(</span><span class="n">output</span><span class="p">,</span> <span class="n">action</span><span class="p">)</span></code>
- </h3>
- <div class="doc doc-contents ">
- <p>Ask the model to correct (without committing to persistent history) after a disallowed command</p>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">716</span>
- <span class="normal">717</span>
- <span class="normal">718</span>
- <span class="normal">719</span>
- <span class="normal">720</span>
- <span class="normal">721</span>
- <span class="normal">722</span>
- <span class="normal">723</span>
- <span class="normal">724</span>
- <span class="normal">725</span>
- <span class="normal">726</span>
- <span class="normal">727</span>
- <span class="normal">728</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">def</span> <span class="nf">retry_after_blocklist_fail</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">output</span><span class="p">:</span> <span class="nb">str</span><span class="p">,</span> <span class="n">action</span><span class="p">:</span> <span class="nb">str</span><span class="p">)</span> <span class="o">-></span> <span class="nb">str</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Ask the model to correct (without committing to persistent history) after a disallowed command"""</span>
- <span class="n">name</span> <span class="o">=</span> <span class="n">action</span><span class="o">.</span><span class="n">strip</span><span class="p">()</span><span class="o">.</span><span class="n">split</span><span class="p">()[</span><span class="mi">0</span><span class="p">]</span>
- <span class="n">blocklist_error_message</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">blocklist_error_template</span><span class="o">.</span><span class="n">format</span><span class="p">(</span><span class="n">name</span><span class="o">=</span><span class="n">name</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="sa">f</span><span class="s2">"BLOCKLISTED OUTPUT</span><span class="se">\n</span><span class="si">{</span><span class="n">output</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="sa">f</span><span class="s2">"BLOCKLIST ERROR</span><span class="se">\n</span><span class="si">{</span><span class="n">blocklist_error_message</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="n">temp_history</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">local_history</span> <span class="o">+</span> <span class="p">[</span>
- <span class="p">{</span><span class="s2">"role"</span><span class="p">:</span> <span class="s2">"assistant"</span><span class="p">,</span> <span class="s2">"content"</span><span class="p">:</span> <span class="n">output</span><span class="p">,</span> <span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">},</span>
- <span class="p">{</span><span class="s2">"role"</span><span class="p">:</span> <span class="s2">"user"</span><span class="p">,</span> <span class="s2">"content"</span><span class="p">:</span> <span class="n">blocklist_error_message</span><span class="p">,</span> <span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">},</span>
- <span class="p">]</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">query</span><span class="p">(</span><span class="n">temp_history</span><span class="p">)</span>
- </code></pre></div></td></tr></table></div>
- </details>
- </div>
- </div>
- <div class="doc doc-object doc-function">
- <h3 id="sweagent.agent.agents.Agent.retry_after_format_fail" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">retry_after_format_fail</span><span class="p">(</span><span class="n">output</span><span class="p">)</span></code>
- </h3>
- <div class="doc doc-contents ">
- <p>Ask the model to correct (without committing to persistent history) after a malformatted model output</p>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">703</span>
- <span class="normal">704</span>
- <span class="normal">705</span>
- <span class="normal">706</span>
- <span class="normal">707</span>
- <span class="normal">708</span>
- <span class="normal">709</span>
- <span class="normal">710</span>
- <span class="normal">711</span>
- <span class="normal">712</span>
- <span class="normal">713</span>
- <span class="normal">714</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">def</span> <span class="nf">retry_after_format_fail</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">output</span><span class="p">:</span> <span class="nb">str</span><span class="p">)</span> <span class="o">-></span> <span class="nb">str</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Ask the model to correct (without committing to persistent history) after a malformatted model output"""</span>
- <span class="n">format_error_template</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">format_error_template</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="sa">f</span><span class="s2">"MALFORMED OUTPUT</span><span class="se">\n</span><span class="si">{</span><span class="n">output</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="sa">f</span><span class="s2">"FORMAT ERROR</span><span class="se">\n</span><span class="si">{</span><span class="n">format_error_template</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="n">temp_history</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">local_history</span> <span class="o">+</span> <span class="p">[</span>
- <span class="p">{</span><span class="s2">"role"</span><span class="p">:</span> <span class="s2">"assistant"</span><span class="p">,</span> <span class="s2">"content"</span><span class="p">:</span> <span class="n">output</span><span class="p">,</span> <span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">},</span>
- <span class="p">{</span><span class="s2">"role"</span><span class="p">:</span> <span class="s2">"user"</span><span class="p">,</span> <span class="s2">"content"</span><span class="p">:</span> <span class="n">format_error_template</span><span class="p">,</span> <span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">},</span>
- <span class="p">]</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">query</span><span class="p">(</span><span class="n">temp_history</span><span class="p">)</span>
- </code></pre></div></td></tr></table></div>
- </details>
- </div>
- </div>
- <div class="doc doc-object doc-function">
- <h3 id="sweagent.agent.agents.Agent.run" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">run</span><span class="p">(</span><span class="n">setup_args</span><span class="p">,</span> <span class="n">env</span><span class="p">,</span> <span class="n">observation</span><span class="o">=</span><span class="kc">None</span><span class="p">,</span> <span class="n">traj_dir</span><span class="o">=</span><span class="kc">None</span><span class="p">,</span> <span class="n">return_type</span><span class="o">=</span><span class="s1">'info_trajectory'</span><span class="p">,</span> <span class="n">init_model_stats</span><span class="o">=</span><span class="kc">None</span><span class="p">)</span></code>
- </h3>
- <div class="doc doc-contents ">
- <p>Run the agent on an environment.
- Return the final value of the specified return type.</p>
- <p><span class="doc-section-title">Parameters:</span></p>
- <table>
- <thead>
- <tr>
- <th>Name</th>
- <th>Type</th>
- <th>Description</th>
- <th>Default</th>
- </tr>
- </thead>
- <tbody>
- <tr class="doc-section-item">
- <td><code>setup_args</code></td>
- <td>
- <code>dict[str, <span title="typing.Any">Any</span>]</code>
- </td>
- <td>
- <div class="doc-md-description">
- <p>Arguments to pass to the agent's setup method.</p>
- </div>
- </td>
- <td>
- <em>required</em>
- </td>
- </tr>
- <tr class="doc-section-item">
- <td><code>env</code></td>
- <td>
- <code><a class="autorefs autorefs-internal" title="sweagent.environment.swe_env.SWEEnv" href="../env/#sweagent.environment.swe_env.SWEEnv">SWEEnv</a></code>
- </td>
- <td>
- <div class="doc-md-description">
- <p>The environment to run the agent on.</p>
- </div>
- </td>
- <td>
- <em>required</em>
- </td>
- </tr>
- <tr class="doc-section-item">
- <td><code>observation</code></td>
- <td>
- <code>str | None</code>
- </td>
- <td>
- <div class="doc-md-description">
- <p>Output from environment setup</p>
- </div>
- </td>
- <td>
- <code>None</code>
- </td>
- </tr>
- <tr class="doc-section-item">
- <td><code>traj_dir</code></td>
- <td>
- <code><span title="pathlib.Path">Path</span> | None</code>
- </td>
- <td>
- <div class="doc-md-description">
- <p>Directory to save the trajectory to</p>
- </div>
- </td>
- <td>
- <code>None</code>
- </td>
- </tr>
- <tr class="doc-section-item">
- <td><code>return_type</code></td>
- <td>
- <code>str</code>
- </td>
- <td>
- <div class="doc-md-description">
- <p>Controls what to return.
- This should be left at <code>info_trajectory</code>, the
- other values are for internal usage with subroutines.</p>
- </div>
- </td>
- <td>
- <code>'info_trajectory'</code>
- </td>
- </tr>
- <tr class="doc-section-item">
- <td><code>init_model_stats</code></td>
- <td>
- <code><span title="sweagent.agent.models.APIStats">APIStats</span> | None</code>
- </td>
- <td>
- <div class="doc-md-description">
- <p>Initial model stats to use for the run.</p>
- </div>
- </td>
- <td>
- <code>None</code>
- </td>
- </tr>
- </tbody>
- </table>
- <p><span class="doc-section-title">Returns:</span></p>
- <table>
- <thead>
- <tr>
- <th>Type</th>
- <th>Description</th>
- </tr>
- </thead>
- <tbody>
- <tr class="doc-section-item">
- <td>
- </td>
- <td>
- <div class="doc-md-description">
- <p>If return_type is "info_trajectory", returns a tuple of</p>
- </div>
- </td>
- </tr>
- <tr class="doc-section-item">
- <td>
- </td>
- <td>
- <div class="doc-md-description">
- <p>the info dictionary and the trajectory (list of dictionaries).</p>
- </div>
- </td>
- </tr>
- </tbody>
- </table>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">1016</span>
- <span class="normal">1017</span>
- <span class="normal">1018</span>
- <span class="normal">1019</span>
- <span class="normal">1020</span>
- <span class="normal">1021</span>
- <span class="normal">1022</span>
- <span class="normal">1023</span>
- <span class="normal">1024</span>
- <span class="normal">1025</span>
- <span class="normal">1026</span>
- <span class="normal">1027</span>
- <span class="normal">1028</span>
- <span class="normal">1029</span>
- <span class="normal">1030</span>
- <span class="normal">1031</span>
- <span class="normal">1032</span>
- <span class="normal">1033</span>
- <span class="normal">1034</span>
- <span class="normal">1035</span>
- <span class="normal">1036</span>
- <span class="normal">1037</span>
- <span class="normal">1038</span>
- <span class="normal">1039</span>
- <span class="normal">1040</span>
- <span class="normal">1041</span>
- <span class="normal">1042</span>
- <span class="normal">1043</span>
- <span class="normal">1044</span>
- <span class="normal">1045</span>
- <span class="normal">1046</span>
- <span class="normal">1047</span>
- <span class="normal">1048</span>
- <span class="normal">1049</span>
- <span class="normal">1050</span>
- <span class="normal">1051</span>
- <span class="normal">1052</span>
- <span class="normal">1053</span>
- <span class="normal">1054</span>
- <span class="normal">1055</span>
- <span class="normal">1056</span>
- <span class="normal">1057</span>
- <span class="normal">1058</span>
- <span class="normal">1059</span>
- <span class="normal">1060</span>
- <span class="normal">1061</span>
- <span class="normal">1062</span>
- <span class="normal">1063</span>
- <span class="normal">1064</span>
- <span class="normal">1065</span>
- <span class="normal">1066</span>
- <span class="normal">1067</span>
- <span class="normal">1068</span>
- <span class="normal">1069</span>
- <span class="normal">1070</span>
- <span class="normal">1071</span>
- <span class="normal">1072</span>
- <span class="normal">1073</span>
- <span class="normal">1074</span>
- <span class="normal">1075</span>
- <span class="normal">1076</span>
- <span class="normal">1077</span>
- <span class="normal">1078</span>
- <span class="normal">1079</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">def</span> <span class="nf">run</span><span class="p">(</span>
- <span class="bp">self</span><span class="p">,</span>
- <span class="n">setup_args</span><span class="p">:</span> <span class="nb">dict</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="n">Any</span><span class="p">],</span>
- <span class="n">env</span><span class="p">:</span> <span class="n">SWEEnv</span><span class="p">,</span>
- <span class="n">observation</span><span class="p">:</span> <span class="nb">str</span> <span class="o">|</span> <span class="kc">None</span> <span class="o">=</span> <span class="kc">None</span><span class="p">,</span>
- <span class="n">traj_dir</span><span class="p">:</span> <span class="n">Path</span> <span class="o">|</span> <span class="kc">None</span> <span class="o">=</span> <span class="kc">None</span><span class="p">,</span>
- <span class="n">return_type</span><span class="p">:</span> <span class="nb">str</span> <span class="o">=</span> <span class="s2">"info_trajectory"</span><span class="p">,</span>
- <span class="n">init_model_stats</span><span class="p">:</span> <span class="n">APIStats</span> <span class="o">|</span> <span class="kc">None</span> <span class="o">=</span> <span class="kc">None</span><span class="p">,</span>
- <span class="p">):</span>
- <span class="w"> </span><span class="sd">"""</span>
- <span class="sd"> Run the agent on an environment.</span>
- <span class="sd"> Return the final value of the specified return type.</span>
- <span class="sd"> Args:</span>
- <span class="sd"> setup_args: Arguments to pass to the agent's setup method.</span>
- <span class="sd"> env: The environment to run the agent on.</span>
- <span class="sd"> observation: Output from environment setup</span>
- <span class="sd"> traj_dir: Directory to save the trajectory to</span>
- <span class="sd"> return_type: Controls what to return.</span>
- <span class="sd"> This should be left at `info_trajectory`, the</span>
- <span class="sd"> other values are for internal usage with subroutines.</span>
- <span class="sd"> init_model_stats: Initial model stats to use for the run.</span>
- <span class="sd"> Returns:</span>
- <span class="sd"> If return_type is "info_trajectory", returns a tuple of</span>
- <span class="sd"> the info dictionary and the trajectory (list of dictionaries).</span>
- <span class="sd"> """</span>
- <span class="k">assert</span> <span class="n">env</span><span class="o">.</span><span class="n">record</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span>
- <span class="k">assert</span> <span class="n">env</span><span class="o">.</span><span class="n">container_obj</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span>
- <span class="k">if</span> <span class="n">env</span><span class="o">.</span><span class="n">container_obj</span><span class="o">.</span><span class="n">id</span> <span class="o">!=</span> <span class="bp">self</span><span class="o">.</span><span class="n">last_container_id</span><span class="p">:</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">info</span><span class="p">(</span><span class="sa">f</span><span class="s2">"Initializing agent settings for container </span><span class="si">{</span><span class="n">env</span><span class="o">.</span><span class="n">container_obj</span><span class="o">.</span><span class="n">id</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">init_environment_vars</span><span class="p">(</span><span class="n">env</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">last_container_id</span> <span class="o">=</span> <span class="n">env</span><span class="o">.</span><span class="n">container_obj</span><span class="o">.</span><span class="n">id</span>
- <span class="c1"># Re-initialize primary</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">setup</span><span class="p">(</span><span class="n">setup_args</span><span class="p">,</span> <span class="n">init_model_stats</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">summarizer_config</span><span class="o">.</span><span class="n">function</span><span class="o">.</span><span class="n">setup</span><span class="p">(</span><span class="n">setup_args</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="p">)</span>
- <span class="c1"># Save/reset some attributes</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">trajectory</span> <span class="o">=</span> <span class="n">Trajectory</span><span class="p">()</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_env</span> <span class="o">=</span> <span class="n">env</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">info</span> <span class="o">=</span> <span class="n">AgentInfo</span><span class="p">()</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">traj_dir</span> <span class="o">=</span> <span class="n">traj_dir</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">info</span><span class="p">(</span><span class="s2">"Trajectory will be saved to </span><span class="si">%s</span><span class="s2">"</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">traj_path</span><span class="p">)</span>
- <span class="c1"># Run action/observation loop</span>
- <span class="k">for</span> <span class="n">hook</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">hooks</span><span class="p">:</span>
- <span class="n">hook</span><span class="o">.</span><span class="n">on_run_start</span><span class="p">()</span>
- <span class="n">done</span> <span class="o">=</span> <span class="kc">False</span>
- <span class="k">while</span> <span class="ow">not</span> <span class="n">done</span><span class="p">:</span>
- <span class="n">observation</span><span class="p">,</span> <span class="n">done</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">_run_step</span><span class="p">(</span><span class="n">observation</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">save_trajectory</span><span class="p">()</span>
- <span class="k">if</span> <span class="n">done</span><span class="p">:</span>
- <span class="n">done</span> <span class="o">=</span> <span class="kc">True</span>
- <span class="k">for</span> <span class="n">hook</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">hooks</span><span class="p">:</span>
- <span class="n">hook</span><span class="o">.</span><span class="n">on_run_done</span><span class="p">(</span><span class="n">trajectory</span><span class="o">=</span><span class="bp">self</span><span class="o">.</span><span class="n">trajectory</span><span class="p">,</span> <span class="n">info</span><span class="o">=</span><span class="bp">self</span><span class="o">.</span><span class="n">info</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">info</span><span class="p">(</span><span class="s2">"Trajectory saved to </span><span class="si">%s</span><span class="s2">"</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">traj_path</span><span class="p">)</span>
- <span class="k">if</span> <span class="n">return_type</span> <span class="o">==</span> <span class="s2">"info"</span><span class="p">:</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">info</span>
- <span class="k">if</span> <span class="n">return_type</span> <span class="o">==</span> <span class="s2">"info_trajectory"</span><span class="p">:</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">info</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">trajectory</span>
- <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">trajectory</span><span class="p">[</span><span class="o">-</span><span class="mi">1</span><span class="p">][</span><span class="n">return_type</span><span class="p">]</span>
- </code></pre></div></td></tr></table></div>
- </details>
- </div>
- </div>
- <div class="doc doc-object doc-function">
- <h3 id="sweagent.agent.agents.Agent.save_trajectory" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">save_trajectory</span><span class="p">()</span></code>
- </h3>
- <div class="doc doc-contents ">
- <p>Save the trajectory to disk.
- This includes the history, the environment state, and the model stats.</p>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">461</span>
- <span class="normal">462</span>
- <span class="normal">463</span>
- <span class="normal">464</span>
- <span class="normal">465</span>
- <span class="normal">466</span>
- <span class="normal">467</span>
- <span class="normal">468</span>
- <span class="normal">469</span>
- <span class="normal">470</span>
- <span class="normal">471</span>
- <span class="normal">472</span>
- <span class="normal">473</span>
- <span class="normal">474</span>
- <span class="normal">475</span>
- <span class="normal">476</span>
- <span class="normal">477</span>
- <span class="normal">478</span>
- <span class="normal">479</span>
- <span class="normal">480</span>
- <span class="normal">481</span>
- <span class="normal">482</span>
- <span class="normal">483</span>
- <span class="normal">484</span>
- <span class="normal">485</span>
- <span class="normal">486</span>
- <span class="normal">487</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">def</span> <span class="nf">save_trajectory</span><span class="p">(</span>
- <span class="bp">self</span><span class="p">,</span>
- <span class="p">)</span> <span class="o">-></span> <span class="kc">None</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Save the trajectory to disk.</span>
- <span class="sd"> This includes the history, the environment state, and the model stats.</span>
- <span class="sd"> """</span>
- <span class="k">def</span> <span class="nf">get_attempt_data</span><span class="p">(</span><span class="n">attempt_idx</span><span class="p">:</span> <span class="nb">int</span><span class="p">)</span> <span class="o">-></span> <span class="nb">dict</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="n">Any</span><span class="p">]:</span>
- <span class="w"> </span><span class="sd">"""Get data saved for every attempt"""</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">_env</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span>
- <span class="c1"># The deepcopy here is important because else the</span>
- <span class="c1"># data["info"]["model_stats"] update will create havoc!</span>
- <span class="k">return</span> <span class="n">copy</span><span class="o">.</span><span class="n">deepcopy</span><span class="p">(</span>
- <span class="p">{</span>
- <span class="s2">"environment"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">_env</span><span class="o">.</span><span class="n">name</span><span class="p">,</span>
- <span class="s2">"trajectory"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">_trajectory_by_attempt</span><span class="p">[</span><span class="n">attempt_idx</span><span class="p">],</span>
- <span class="s2">"history"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">_history_by_attempt</span><span class="p">[</span><span class="n">attempt_idx</span><span class="p">],</span>
- <span class="s2">"info"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">_info_by_attempt</span><span class="p">[</span><span class="n">attempt_idx</span><span class="p">],</span>
- <span class="p">}</span>
- <span class="p">)</span>
- <span class="n">data</span> <span class="o">=</span> <span class="p">{</span>
- <span class="o">**</span><span class="n">get_attempt_data</span><span class="p">(</span><span class="mi">0</span><span class="p">),</span>
- <span class="p">}</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">traj_path</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">traj_path</span><span class="o">.</span><span class="n">write_text</span><span class="p">(</span><span class="n">json</span><span class="o">.</span><span class="n">dumps</span><span class="p">(</span><span class="n">data</span><span class="p">,</span> <span class="n">indent</span><span class="o">=</span><span class="mi">2</span><span class="p">))</span>
- </code></pre></div></td></tr></table></div>
- </details>
- </div>
- </div>
- <div class="doc doc-object doc-function">
- <h3 id="sweagent.agent.agents.Agent.set_environment_vars" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">set_environment_vars</span><span class="p">(</span><span class="n">env</span><span class="p">,</span> <span class="n">env_variables</span><span class="p">)</span></code>
- </h3>
- <div class="doc doc-contents ">
- <p>Sets environment variables in the container and for example makes sure
- that all the commands are available in the PATH on the container.</p>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">829</span>
- <span class="normal">830</span>
- <span class="normal">831</span>
- <span class="normal">832</span>
- <span class="normal">833</span>
- <span class="normal">834</span>
- <span class="normal">835</span>
- <span class="normal">836</span>
- <span class="normal">837</span>
- <span class="normal">838</span>
- <span class="normal">839</span>
- <span class="normal">840</span>
- <span class="normal">841</span>
- <span class="normal">842</span>
- <span class="normal">843</span>
- <span class="normal">844</span>
- <span class="normal">845</span>
- <span class="normal">846</span>
- <span class="normal">847</span>
- <span class="normal">848</span>
- <span class="normal">849</span>
- <span class="normal">850</span>
- <span class="normal">851</span>
- <span class="normal">852</span>
- <span class="normal">853</span>
- <span class="normal">854</span>
- <span class="normal">855</span>
- <span class="normal">856</span>
- <span class="normal">857</span>
- <span class="normal">858</span>
- <span class="normal">859</span>
- <span class="normal">860</span>
- <span class="normal">861</span>
- <span class="normal">862</span>
- <span class="normal">863</span>
- <span class="normal">864</span>
- <span class="normal">865</span>
- <span class="normal">866</span>
- <span class="normal">867</span>
- <span class="normal">868</span>
- <span class="normal">869</span>
- <span class="normal">870</span>
- <span class="normal">871</span>
- <span class="normal">872</span>
- <span class="normal">873</span>
- <span class="normal">874</span>
- <span class="normal">875</span>
- <span class="normal">876</span>
- <span class="normal">877</span>
- <span class="normal">878</span>
- <span class="normal">879</span>
- <span class="normal">880</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">def</span> <span class="nf">set_environment_vars</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">env</span><span class="p">:</span> <span class="n">SWEEnv</span><span class="p">,</span> <span class="n">env_variables</span><span class="p">:</span> <span class="nb">dict</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="n">Any</span><span class="p">])</span> <span class="o">-></span> <span class="kc">None</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Sets environment variables in the container and for example makes sure</span>
- <span class="sd"> that all the commands are available in the PATH on the container.</span>
- <span class="sd"> """</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="c1"># mypy</span>
- <span class="n">commands_to_execute</span> <span class="o">=</span> <span class="p">(</span>
- <span class="p">[</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">state_command</span><span class="o">.</span><span class="n">code</span><span class="p">]</span>
- <span class="o">+</span>
- <span class="c1"># [code for code in self.config.util_functions] +</span>
- <span class="c1"># [command.code for command in self.config._commands] +</span>
- <span class="p">[</span><span class="sa">f</span><span class="s2">"</span><span class="si">{</span><span class="n">k</span><span class="si">}</span><span class="s2">=</span><span class="si">{</span><span class="n">v</span><span class="si">}</span><span class="s2">"</span> <span class="k">for</span> <span class="n">k</span><span class="p">,</span> <span class="n">v</span> <span class="ow">in</span> <span class="n">env_variables</span><span class="o">.</span><span class="n">items</span><span class="p">()]</span>
- <span class="p">)</span>
- <span class="n">commands</span> <span class="o">=</span> <span class="s2">"</span><span class="se">\n</span><span class="s2">"</span><span class="o">.</span><span class="n">join</span><span class="p">(</span><span class="n">commands_to_execute</span><span class="p">)</span>
- <span class="k">try</span><span class="p">:</span>
- <span class="n">output</span> <span class="o">=</span> <span class="n">env</span><span class="o">.</span><span class="n">communicate</span><span class="p">(</span><span class="n">commands</span><span class="p">)</span>
- <span class="k">if</span> <span class="n">env</span><span class="o">.</span><span class="n">returncode</span> <span class="o">!=</span> <span class="mi">0</span><span class="p">:</span>
- <span class="n">msg</span> <span class="o">=</span> <span class="sa">f</span><span class="s2">"Nonzero return code: </span><span class="si">{</span><span class="n">env</span><span class="o">.</span><span class="n">returncode</span><span class="si">}</span><span class="se">\n</span><span class="s2">Output: </span><span class="si">{</span><span class="n">output</span><span class="si">}</span><span class="s2">"</span>
- <span class="k">raise</span> <span class="ne">RuntimeError</span><span class="p">(</span><span class="n">msg</span><span class="p">)</span>
- <span class="k">except</span> <span class="ne">KeyboardInterrupt</span><span class="p">:</span>
- <span class="k">raise</span>
- <span class="k">except</span> <span class="ne">Exception</span> <span class="k">as</span> <span class="n">e</span><span class="p">:</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="sa">f</span><span class="s2">"Failed to set environment variables: </span><span class="si">{</span><span class="n">traceback</span><span class="o">.</span><span class="n">format_exc</span><span class="p">()</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="k">raise</span> <span class="n">e</span>
- <span class="n">command_files</span> <span class="o">=</span> <span class="nb">list</span><span class="p">()</span>
- <span class="k">for</span> <span class="n">file</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">command_files</span><span class="p">:</span>
- <span class="n">datum</span> <span class="o">=</span> <span class="nb">dict</span><span class="p">()</span>
- <span class="k">with</span> <span class="nb">open</span><span class="p">(</span><span class="n">file</span><span class="p">)</span> <span class="k">as</span> <span class="n">f</span><span class="p">:</span>
- <span class="n">contents</span> <span class="o">=</span> <span class="n">f</span><span class="o">.</span><span class="n">read</span><span class="p">()</span>
- <span class="n">datum</span><span class="p">[</span><span class="s2">"contents"</span><span class="p">]</span> <span class="o">=</span> <span class="n">contents</span>
- <span class="n">filename</span> <span class="o">=</span> <span class="n">Path</span><span class="p">(</span><span class="n">file</span><span class="p">)</span><span class="o">.</span><span class="n">name</span>
- <span class="k">if</span> <span class="ow">not</span> <span class="n">contents</span><span class="o">.</span><span class="n">strip</span><span class="p">()</span><span class="o">.</span><span class="n">startswith</span><span class="p">(</span><span class="s2">"#!"</span><span class="p">):</span>
- <span class="k">if</span> <span class="n">filename</span><span class="o">.</span><span class="n">endswith</span><span class="p">(</span><span class="s2">".sh"</span><span class="p">):</span>
- <span class="c1"># files are sourced, so they are not executable</span>
- <span class="n">datum</span><span class="p">[</span><span class="s2">"name"</span><span class="p">]</span> <span class="o">=</span> <span class="n">Path</span><span class="p">(</span><span class="n">file</span><span class="p">)</span><span class="o">.</span><span class="n">name</span>
- <span class="n">datum</span><span class="p">[</span><span class="s2">"type"</span><span class="p">]</span> <span class="o">=</span> <span class="s2">"source_file"</span>
- <span class="k">elif</span> <span class="n">filename</span><span class="o">.</span><span class="n">startswith</span><span class="p">(</span><span class="s2">"_"</span><span class="p">):</span>
- <span class="c1"># files are sourced, so they are not executable</span>
- <span class="n">datum</span><span class="p">[</span><span class="s2">"name"</span><span class="p">]</span> <span class="o">=</span> <span class="n">Path</span><span class="p">(</span><span class="n">file</span><span class="p">)</span><span class="o">.</span><span class="n">name</span>
- <span class="n">datum</span><span class="p">[</span><span class="s2">"type"</span><span class="p">]</span> <span class="o">=</span> <span class="s2">"utility"</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="n">msg</span> <span class="o">=</span> <span class="p">(</span>
- <span class="sa">f</span><span class="s2">"Non-shell script file </span><span class="si">{</span><span class="n">file</span><span class="si">}</span><span class="s2"> does not start with shebang.</span><span class="se">\n</span><span class="s2">"</span>
- <span class="s2">"Either add a shebang (#!) or change the file extension to .sh if you want to source it.</span><span class="se">\n</span><span class="s2">"</span>
- <span class="s2">"You can override this behavior by adding an underscore to the file name (e.g. _utils.py)."</span>
- <span class="p">)</span>
- <span class="k">raise</span> <span class="ne">ValueError</span><span class="p">(</span><span class="n">msg</span><span class="p">)</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="c1"># scripts are made executable</span>
- <span class="n">datum</span><span class="p">[</span><span class="s2">"name"</span><span class="p">]</span> <span class="o">=</span> <span class="n">Path</span><span class="p">(</span><span class="n">file</span><span class="p">)</span><span class="o">.</span><span class="n">name</span><span class="o">.</span><span class="n">rsplit</span><span class="p">(</span><span class="s2">"."</span><span class="p">,</span> <span class="mi">1</span><span class="p">)[</span><span class="mi">0</span><span class="p">]</span>
- <span class="n">datum</span><span class="p">[</span><span class="s2">"type"</span><span class="p">]</span> <span class="o">=</span> <span class="s2">"script"</span>
- <span class="n">command_files</span><span class="o">.</span><span class="n">append</span><span class="p">(</span><span class="n">datum</span><span class="p">)</span>
- <span class="n">env</span><span class="o">.</span><span class="n">add_commands</span><span class="p">(</span><span class="n">command_files</span><span class="p">)</span>
- </code></pre></div></td></tr></table></div>
- </details>
- </div>
- </div>
- <div class="doc doc-object doc-function">
- <h3 id="sweagent.agent.agents.Agent.setup" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">setup</span><span class="p">(</span><span class="n">instance_args</span><span class="p">,</span> <span class="n">init_model_stats</span><span class="o">=</span><span class="kc">None</span><span class="p">)</span></code>
- </h3>
- <div class="doc doc-contents ">
- <p>Setup the agent for a new instance. This includes
- formatting the system message and adding demonstrations to the history.</p>
- <p><span class="doc-section-title">Parameters:</span></p>
- <table>
- <thead>
- <tr>
- <th>Name</th>
- <th>Type</th>
- <th>Description</th>
- <th>Default</th>
- </tr>
- </thead>
- <tbody>
- <tr class="doc-section-item">
- <td><code>instance_args</code></td>
- <td>
- <code>dict[str, <span title="typing.Any">Any</span>]</code>
- </td>
- <td>
- <div class="doc-md-description">
- <p>Arguments for the instance</p>
- </div>
- </td>
- <td>
- <em>required</em>
- </td>
- </tr>
- </tbody>
- </table>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">359</span>
- <span class="normal">360</span>
- <span class="normal">361</span>
- <span class="normal">362</span>
- <span class="normal">363</span>
- <span class="normal">364</span>
- <span class="normal">365</span>
- <span class="normal">366</span>
- <span class="normal">367</span>
- <span class="normal">368</span>
- <span class="normal">369</span>
- <span class="normal">370</span>
- <span class="normal">371</span>
- <span class="normal">372</span>
- <span class="normal">373</span>
- <span class="normal">374</span>
- <span class="normal">375</span>
- <span class="normal">376</span>
- <span class="normal">377</span>
- <span class="normal">378</span>
- <span class="normal">379</span>
- <span class="normal">380</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">def</span> <span class="nf">setup</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">instance_args</span><span class="p">:</span> <span class="nb">dict</span><span class="p">[</span><span class="nb">str</span><span class="p">,</span> <span class="n">Any</span><span class="p">],</span> <span class="n">init_model_stats</span><span class="p">:</span> <span class="n">APIStats</span> <span class="o">|</span> <span class="kc">None</span> <span class="o">=</span> <span class="kc">None</span><span class="p">)</span> <span class="o">-></span> <span class="kc">None</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Setup the agent for a new instance. This includes</span>
- <span class="sd"> formatting the system message and adding demonstrations to the history.</span>
- <span class="sd"> Args:</span>
- <span class="sd"> instance_args: Arguments for the instance</span>
- <span class="sd"> """</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="c1"># mypy</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">instance_args</span> <span class="o">=</span> <span class="n">instance_args</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_i_attempt</span> <span class="o">=</span> <span class="mi">0</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_history_by_attempt</span> <span class="o">=</span> <span class="n">defaultdict</span><span class="p">(</span><span class="nb">list</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_trajectory_by_attempt</span> <span class="o">=</span> <span class="n">defaultdict</span><span class="p">(</span><span class="nb">list</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_info_by_attempt</span> <span class="o">=</span> <span class="n">defaultdict</span><span class="p">(</span><span class="nb">dict</span><span class="p">)</span> <span class="c1"># type: ignore</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_forwarded_vars</span> <span class="o">=</span> <span class="p">{}</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">_rloop</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span><span class="p">:</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_forwarded_vars</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">_rloop</span><span class="o">.</span><span class="n">get_forwarded_vars</span><span class="p">()</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">setup_attempt</span><span class="p">(</span><span class="n">init_model_stats</span><span class="o">=</span><span class="n">init_model_stats</span><span class="p">)</span>
- <span class="k">for</span> <span class="n">hook</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">hooks</span><span class="p">:</span>
- <span class="n">hook</span><span class="o">.</span><span class="n">on_setup_done</span><span class="p">()</span>
- </code></pre></div></td></tr></table></div>
- </details>
- </div>
- </div>
- <div class="doc doc-object doc-function">
- <h3 id="sweagent.agent.agents.Agent.setup_attempt" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">setup_attempt</span><span class="p">(</span><span class="o">*</span><span class="p">,</span> <span class="n">init_model_stats</span><span class="o">=</span><span class="kc">None</span><span class="p">)</span></code>
- </h3>
- <div class="doc doc-contents ">
- <p>Setup the agent for a new attempt. This includes resetting the model stats.</p>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">382</span>
- <span class="normal">383</span>
- <span class="normal">384</span>
- <span class="normal">385</span>
- <span class="normal">386</span>
- <span class="normal">387</span>
- <span class="normal">388</span>
- <span class="normal">389</span>
- <span class="normal">390</span>
- <span class="normal">391</span>
- <span class="normal">392</span>
- <span class="normal">393</span>
- <span class="normal">394</span>
- <span class="normal">395</span>
- <span class="normal">396</span>
- <span class="normal">397</span>
- <span class="normal">398</span>
- <span class="normal">399</span>
- <span class="normal">400</span>
- <span class="normal">401</span>
- <span class="normal">402</span>
- <span class="normal">403</span>
- <span class="normal">404</span>
- <span class="normal">405</span>
- <span class="normal">406</span>
- <span class="normal">407</span>
- <span class="normal">408</span>
- <span class="normal">409</span>
- <span class="normal">410</span>
- <span class="normal">411</span>
- <span class="normal">412</span>
- <span class="normal">413</span>
- <span class="normal">414</span>
- <span class="normal">415</span>
- <span class="normal">416</span>
- <span class="normal">417</span>
- <span class="normal">418</span>
- <span class="normal">419</span>
- <span class="normal">420</span>
- <span class="normal">421</span>
- <span class="normal">422</span>
- <span class="normal">423</span>
- <span class="normal">424</span>
- <span class="normal">425</span>
- <span class="normal">426</span>
- <span class="normal">427</span>
- <span class="normal">428</span>
- <span class="normal">429</span>
- <span class="normal">430</span>
- <span class="normal">431</span>
- <span class="normal">432</span>
- <span class="normal">433</span>
- <span class="normal">434</span>
- <span class="normal">435</span>
- <span class="normal">436</span>
- <span class="normal">437</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">def</span> <span class="nf">setup_attempt</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="o">*</span><span class="p">,</span> <span class="n">init_model_stats</span><span class="p">:</span> <span class="n">APIStats</span> <span class="o">|</span> <span class="kc">None</span> <span class="o">=</span> <span class="kc">None</span><span class="p">)</span> <span class="o">-></span> <span class="kc">None</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Setup the agent for a new attempt. This includes resetting the model stats."""</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="c1"># mypy</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">_i_attempt</span> <span class="o">></span> <span class="mi">0</span> <span class="ow">and</span> <span class="n">init_model_stats</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span><span class="p">:</span>
- <span class="n">msg</span> <span class="o">=</span> <span class="p">(</span>
- <span class="s2">"We might be dealing with nested retries, where subroutines are mixed with retries. "</span>
- <span class="s2">"Currently, this messes up accounting with init_model_stats."</span>
- <span class="p">)</span>
- <span class="k">raise</span> <span class="ne">ValueError</span><span class="p">(</span><span class="n">msg</span><span class="p">)</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">_i_attempt</span> <span class="o">></span> <span class="mi">0</span><span class="p">:</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">_env</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="c1"># mypy</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_env</span><span class="o">.</span><span class="n">reset_for_new_attempt</span><span class="p">()</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">reset_stats</span><span class="p">(</span><span class="n">init_model_stats</span><span class="p">)</span>
- <span class="c1"># self.model = get_model(self._args.model, self.config._commands + self.config.subroutine_types)</span>
- <span class="c1"># fixme: This doesn't reset total cost</span>
- <span class="n">system_msg</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">system_template</span><span class="o">.</span><span class="n">format</span><span class="p">(</span><span class="o">**</span><span class="bp">self</span><span class="o">.</span><span class="n">system_args</span><span class="p">,</span> <span class="o">**</span><span class="bp">self</span><span class="o">.</span><span class="n">instance_args</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">info</span><span class="p">(</span><span class="sa">f</span><span class="s2">"SYSTEM (</span><span class="si">{</span><span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="si">}</span><span class="s2">)</span><span class="se">\n</span><span class="si">{</span><span class="n">system_msg</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_append_history</span><span class="p">(</span><span class="n">HistoryItem</span><span class="p">({</span><span class="s2">"role"</span><span class="p">:</span> <span class="s2">"system"</span><span class="p">,</span> <span class="s2">"content"</span><span class="p">:</span> <span class="n">system_msg</span><span class="p">,</span> <span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">}))</span>
- <span class="k">if</span> <span class="s2">"history_to_messages"</span> <span class="ow">in</span> <span class="nb">dir</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="p">):</span>
- <span class="k">for</span> <span class="n">demonstration_path</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">demonstrations</span><span class="p">:</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">demonstration_template</span> <span class="ow">is</span> <span class="kc">None</span> <span class="ow">and</span> <span class="ow">not</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">put_demos_in_history</span><span class="p">:</span>
- <span class="n">msg</span> <span class="o">=</span> <span class="s2">"Cannot use demonstrations without a demonstration template or put_demos_in_history=True"</span>
- <span class="k">raise</span> <span class="ne">ValueError</span><span class="p">(</span><span class="n">msg</span><span class="p">)</span>
- <span class="c1"># Load history</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">info</span><span class="p">(</span><span class="sa">f</span><span class="s2">"DEMONSTRATION: </span><span class="si">{</span><span class="n">demonstration_path</span><span class="si">}</span><span class="s2">"</span><span class="p">)</span>
- <span class="n">demo_history</span> <span class="o">=</span> <span class="n">json</span><span class="o">.</span><span class="n">loads</span><span class="p">(</span><span class="n">Path</span><span class="p">(</span><span class="n">demonstration_path</span><span class="p">)</span><span class="o">.</span><span class="n">read_text</span><span class="p">())[</span><span class="s2">"history"</span><span class="p">]</span>
- <span class="n">demo_history</span> <span class="o">=</span> <span class="p">[</span>
- <span class="n">entry</span>
- <span class="k">for</span> <span class="n">entry</span> <span class="ow">in</span> <span class="n">demo_history</span>
- <span class="k">if</span> <span class="p">(</span><span class="s2">"agent"</span> <span class="ow">not</span> <span class="ow">in</span> <span class="n">entry</span><span class="p">)</span> <span class="ow">or</span> <span class="p">(</span><span class="s2">"agent"</span> <span class="ow">in</span> <span class="n">entry</span> <span class="ow">and</span> <span class="n">entry</span><span class="p">[</span><span class="s2">"agent"</span><span class="p">]</span> <span class="o">==</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">)</span>
- <span class="p">]</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">put_demos_in_history</span><span class="p">:</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">demonstration_template</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span><span class="p">:</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">logger</span><span class="o">.</span><span class="n">warning</span><span class="p">(</span><span class="s2">"Demonstration template is ignored for put_demos_in_history=True"</span><span class="p">)</span>
- <span class="c1"># Add demonstration to history directly as separate messages</span>
- <span class="k">for</span> <span class="n">entry</span> <span class="ow">in</span> <span class="n">demo_history</span><span class="p">:</span>
- <span class="k">if</span> <span class="n">entry</span><span class="p">[</span><span class="s2">"role"</span><span class="p">]</span> <span class="o">!=</span> <span class="s2">"system"</span><span class="p">:</span>
- <span class="n">entry</span><span class="p">[</span><span class="s2">"is_demo"</span><span class="p">]</span> <span class="o">=</span> <span class="kc">True</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_append_history</span><span class="p">(</span><span class="n">entry</span><span class="p">)</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="c1"># Add demonstration as single message to history</span>
- <span class="n">demo_message</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">history_to_messages</span><span class="p">(</span>
- <span class="n">demo_history</span><span class="p">,</span>
- <span class="n">is_demonstration</span><span class="o">=</span><span class="kc">True</span><span class="p">,</span>
- <span class="p">)</span>
- <span class="n">demonstration</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">demonstration_template</span><span class="o">.</span><span class="n">format</span><span class="p">(</span><span class="n">demonstration</span><span class="o">=</span><span class="n">demo_message</span><span class="p">)</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">_append_history</span><span class="p">(</span>
- <span class="p">{</span>
- <span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">,</span>
- <span class="s2">"content"</span><span class="p">:</span> <span class="n">demonstration</span><span class="p">,</span>
- <span class="s2">"is_demo"</span><span class="p">:</span> <span class="kc">True</span><span class="p">,</span>
- <span class="s2">"role"</span><span class="p">:</span> <span class="s2">"user"</span><span class="p">,</span>
- <span class="p">},</span>
- <span class="p">)</span>
- </code></pre></div></td></tr></table></div>
- </details>
- </div>
- </div>
- <div class="doc doc-object doc-function">
- <h3 id="sweagent.agent.agents.Agent.should_block_action" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">should_block_action</span><span class="p">(</span><span class="n">action</span><span class="p">)</span></code>
- </h3>
- <div class="doc doc-contents ">
- <p>Check if the command should be blocked.</p>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">730</span>
- <span class="normal">731</span>
- <span class="normal">732</span>
- <span class="normal">733</span>
- <span class="normal">734</span>
- <span class="normal">735</span>
- <span class="normal">736</span>
- <span class="normal">737</span>
- <span class="normal">738</span>
- <span class="normal">739</span>
- <span class="normal">740</span>
- <span class="normal">741</span>
- <span class="normal">742</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">def</span> <span class="nf">should_block_action</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">action</span><span class="p">:</span> <span class="nb">str</span><span class="p">)</span> <span class="o">-></span> <span class="nb">bool</span><span class="p">:</span>
- <span class="w"> </span><span class="sd">"""Check if the command should be blocked."""</span>
- <span class="n">names</span> <span class="o">=</span> <span class="n">action</span><span class="o">.</span><span class="n">strip</span><span class="p">()</span><span class="o">.</span><span class="n">split</span><span class="p">()</span>
- <span class="k">if</span> <span class="nb">len</span><span class="p">(</span><span class="n">names</span><span class="p">)</span> <span class="o">==</span> <span class="mi">0</span><span class="p">:</span>
- <span class="k">return</span> <span class="kc">False</span>
- <span class="n">name</span> <span class="o">=</span> <span class="n">names</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span>
- <span class="k">if</span> <span class="n">name</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">blocklist</span><span class="p">:</span>
- <span class="k">return</span> <span class="kc">True</span>
- <span class="k">if</span> <span class="n">name</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">blocklist_standalone</span> <span class="ow">and</span> <span class="n">name</span> <span class="o">==</span> <span class="n">action</span><span class="o">.</span><span class="n">strip</span><span class="p">():</span>
- <span class="k">return</span> <span class="kc">True</span>
- <span class="k">if</span> <span class="n">name</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">block_unless_regex</span> <span class="ow">and</span> <span class="ow">not</span> <span class="n">re</span><span class="o">.</span><span class="n">search</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">block_unless_regex</span><span class="p">[</span><span class="n">name</span><span class="p">],</span> <span class="n">action</span><span class="p">):</span>
- <span class="k">return</span> <span class="kc">True</span>
- <span class="k">return</span> <span class="kc">False</span>
- </code></pre></div></td></tr></table></div>
- </details>
- </div>
- </div>
- <div class="doc doc-object doc-function">
- <h3 id="sweagent.agent.agents.Agent.split_actions" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">split_actions</span><span class="p">(</span><span class="n">action</span><span class="p">,</span> <span class="n">pattern_type</span><span class="o">=</span><span class="s1">'subroutine'</span><span class="p">)</span></code>
- </h3>
- <div class="doc doc-contents ">
- <p>Split an action into a list of actions in a greedy manner, each of which is a subroutine call or a single command.</p>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">548</span>
- <span class="normal">549</span>
- <span class="normal">550</span>
- <span class="normal">551</span>
- <span class="normal">552</span>
- <span class="normal">553</span>
- <span class="normal">554</span>
- <span class="normal">555</span>
- <span class="normal">556</span>
- <span class="normal">557</span>
- <span class="normal">558</span>
- <span class="normal">559</span>
- <span class="normal">560</span>
- <span class="normal">561</span>
- <span class="normal">562</span>
- <span class="normal">563</span>
- <span class="normal">564</span>
- <span class="normal">565</span>
- <span class="normal">566</span>
- <span class="normal">567</span>
- <span class="normal">568</span>
- <span class="normal">569</span>
- <span class="normal">570</span>
- <span class="normal">571</span>
- <span class="normal">572</span>
- <span class="normal">573</span>
- <span class="normal">574</span>
- <span class="normal">575</span>
- <span class="normal">576</span>
- <span class="normal">577</span>
- <span class="normal">578</span>
- <span class="normal">579</span>
- <span class="normal">580</span>
- <span class="normal">581</span>
- <span class="normal">582</span>
- <span class="normal">583</span>
- <span class="normal">584</span>
- <span class="normal">585</span>
- <span class="normal">586</span>
- <span class="normal">587</span>
- <span class="normal">588</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">def</span> <span class="nf">split_actions</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">action</span><span class="p">:</span> <span class="nb">str</span><span class="p">,</span> <span class="n">pattern_type</span><span class="o">=</span><span class="s2">"subroutine"</span><span class="p">)</span> <span class="o">-></span> <span class="nb">list</span><span class="p">[</span><span class="n">SubAction</span><span class="p">]:</span>
- <span class="w"> </span><span class="sd">"""Split an action into a list of actions in a greedy manner, each of which is a subroutine call or a single command."""</span>
- <span class="n">parsed_action</span><span class="p">:</span> <span class="nb">list</span><span class="p">[</span><span class="n">SubAction</span><span class="p">]</span> <span class="o">=</span> <span class="nb">list</span><span class="p">()</span>
- <span class="n">rem_action</span> <span class="o">=</span> <span class="n">action</span>
- <span class="k">while</span> <span class="n">rem_action</span><span class="o">.</span><span class="n">strip</span><span class="p">():</span>
- <span class="n">first_match</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">_get_first_match</span><span class="p">(</span><span class="n">rem_action</span><span class="p">,</span> <span class="n">pattern_type</span><span class="p">)</span>
- <span class="k">if</span> <span class="n">first_match</span><span class="p">:</span>
- <span class="n">pre_action</span> <span class="o">=</span> <span class="n">rem_action</span><span class="p">[:</span> <span class="n">first_match</span><span class="o">.</span><span class="n">start</span><span class="p">()]</span>
- <span class="n">match_action</span> <span class="o">=</span> <span class="n">rem_action</span><span class="p">[</span><span class="n">first_match</span><span class="o">.</span><span class="n">start</span><span class="p">()</span> <span class="p">:</span> <span class="n">first_match</span><span class="o">.</span><span class="n">end</span><span class="p">()]</span>
- <span class="n">rem_action</span> <span class="o">=</span> <span class="n">rem_action</span><span class="p">[</span><span class="n">first_match</span><span class="o">.</span><span class="n">end</span><span class="p">()</span> <span class="p">:]</span>
- <span class="k">if</span> <span class="n">pre_action</span><span class="o">.</span><span class="n">strip</span><span class="p">():</span>
- <span class="n">parsed_action</span><span class="o">.</span><span class="n">append</span><span class="p">({</span><span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">,</span> <span class="s2">"action"</span><span class="p">:</span> <span class="n">pre_action</span><span class="p">,</span> <span class="s2">"cmd_name"</span><span class="p">:</span> <span class="kc">None</span><span class="p">,</span> <span class="s2">"args"</span><span class="p">:</span> <span class="s2">""</span><span class="p">})</span>
- <span class="k">if</span> <span class="n">match_action</span><span class="o">.</span><span class="n">strip</span><span class="p">():</span>
- <span class="k">if</span> <span class="n">match_action</span><span class="o">.</span><span class="n">split</span><span class="p">()[</span><span class="mi">0</span><span class="p">]</span> <span class="o">==</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="o">.</span><span class="n">submit_command</span><span class="p">:</span>
- <span class="n">parsed_action</span><span class="o">.</span><span class="n">append</span><span class="p">(</span>
- <span class="n">SubAction</span><span class="p">(</span>
- <span class="p">{</span>
- <span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">,</span>
- <span class="s2">"action"</span><span class="p">:</span> <span class="n">match_action</span><span class="p">,</span>
- <span class="s2">"cmd_name"</span><span class="p">:</span> <span class="n">first_match</span><span class="o">.</span><span class="n">group</span><span class="p">(</span><span class="mi">1</span><span class="p">),</span>
- <span class="s2">"args"</span><span class="p">:</span> <span class="s2">""</span><span class="p">,</span>
- <span class="p">},</span>
- <span class="p">)</span>
- <span class="p">)</span> <span class="c1"># submit command is not a subroutine</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="n">parsed_action</span><span class="o">.</span><span class="n">append</span><span class="p">(</span>
- <span class="n">SubAction</span><span class="p">(</span>
- <span class="p">{</span>
- <span class="s2">"agent"</span><span class="p">:</span> <span class="n">first_match</span><span class="o">.</span><span class="n">group</span><span class="p">(</span><span class="mi">1</span><span class="p">),</span>
- <span class="s2">"args"</span><span class="p">:</span> <span class="n">first_match</span><span class="o">.</span><span class="n">group</span><span class="p">(</span><span class="mi">2</span><span class="p">),</span>
- <span class="s2">"action"</span><span class="p">:</span> <span class="n">match_action</span><span class="p">,</span>
- <span class="s2">"cmd_name"</span><span class="p">:</span> <span class="n">first_match</span><span class="o">.</span><span class="n">group</span><span class="p">(</span><span class="mi">1</span><span class="p">),</span>
- <span class="p">},</span>
- <span class="p">)</span>
- <span class="p">)</span>
- <span class="k">else</span><span class="p">:</span>
- <span class="n">parsed_action</span><span class="o">.</span><span class="n">append</span><span class="p">(</span>
- <span class="n">SubAction</span><span class="p">({</span><span class="s2">"agent"</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">name</span><span class="p">,</span> <span class="s2">"action"</span><span class="p">:</span> <span class="n">rem_action</span><span class="p">,</span> <span class="s2">"cmd_name"</span><span class="p">:</span> <span class="kc">None</span><span class="p">,</span> <span class="s2">"args"</span><span class="p">:</span> <span class="s2">""</span><span class="p">})</span>
- <span class="p">)</span>
- <span class="n">rem_action</span> <span class="o">=</span> <span class="s2">""</span>
- <span class="k">return</span> <span class="n">parsed_action</span>
- </code></pre></div></td></tr></table></div>
- </details>
- </div>
- </div>
- </div>
- </div>
- </div>
- <div class="doc doc-object doc-class">
- <h2 id="sweagent.agent.agents.AgentArguments" class="doc doc-heading">
- <code>AgentArguments</code>
- <span class="doc doc-labels">
- <small class="doc doc-label doc-label-dataclass"><code>dataclass</code></small>
- </span>
- </h2>
- <div class="doc doc-contents ">
- <p class="doc doc-class-bases">
- Bases: <code><span title="simple_parsing.helpers.flatten.FlattenedAccess">FlattenedAccess</span></code>, <code><span title="simple_parsing.helpers.serialization.serializable.FrozenSerializable">FrozenSerializable</span></code></p>
- <p>Configure the agent's behaviour (templates, parse functions, blocklists, ...).</p>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">191</span>
- <span class="normal">192</span>
- <span class="normal">193</span>
- <span class="normal">194</span>
- <span class="normal">195</span>
- <span class="normal">196</span>
- <span class="normal">197</span>
- <span class="normal">198</span>
- <span class="normal">199</span>
- <span class="normal">200</span>
- <span class="normal">201</span>
- <span class="normal">202</span>
- <span class="normal">203</span>
- <span class="normal">204</span>
- <span class="normal">205</span>
- <span class="normal">206</span>
- <span class="normal">207</span>
- <span class="normal">208</span>
- <span class="normal">209</span>
- <span class="normal">210</span>
- <span class="normal">211</span>
- <span class="normal">212</span>
- <span class="normal">213</span>
- <span class="normal">214</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="nd">@dataclass</span><span class="p">(</span><span class="n">frozen</span><span class="o">=</span><span class="kc">True</span><span class="p">)</span>
- <span class="k">class</span> <span class="nc">AgentArguments</span><span class="p">(</span><span class="n">FlattenedAccess</span><span class="p">,</span> <span class="n">FrozenSerializable</span><span class="p">):</span>
- <span class="w"> </span><span class="sd">"""Configure the agent's behaviour (templates, parse functions, blocklists, ...)."""</span>
- <span class="n">model</span><span class="p">:</span> <span class="n">ModelArguments</span> <span class="o">=</span> <span class="kc">None</span>
- <span class="c1"># Policy can only be set via config yaml file from command line</span>
- <span class="n">config_file</span><span class="p">:</span> <span class="n">Path</span> <span class="o">|</span> <span class="kc">None</span> <span class="o">=</span> <span class="kc">None</span>
- <span class="n">config</span><span class="p">:</span> <span class="n">AgentConfig</span> <span class="o">|</span> <span class="kc">None</span> <span class="o">=</span> <span class="n">field</span><span class="p">(</span><span class="n">default</span><span class="o">=</span><span class="kc">None</span><span class="p">,</span> <span class="n">cmd</span><span class="o">=</span><span class="kc">False</span><span class="p">)</span>
- <span class="k">def</span> <span class="nf">__post_init__</span><span class="p">(</span><span class="bp">self</span><span class="p">):</span>
- <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="kc">None</span> <span class="ow">and</span> <span class="bp">self</span><span class="o">.</span><span class="n">config_file</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span><span class="p">:</span>
- <span class="c1"># If unassigned, we load the config from the file to store its contents with the overall arguments</span>
- <span class="n">config</span> <span class="o">=</span> <span class="n">AgentConfig</span><span class="o">.</span><span class="n">load_yaml</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">config_file</span><span class="p">)</span>
- <span class="nb">object</span><span class="o">.</span><span class="fm">__setattr__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="s2">"config"</span><span class="p">,</span> <span class="n">config</span><span class="p">)</span>
- <span class="k">assert</span> <span class="bp">self</span><span class="o">.</span><span class="n">config</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span> <span class="c1"># mypy</span>
- <span class="k">for</span> <span class="n">subroutine</span> <span class="ow">in</span> <span class="nb">getattr</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">config</span><span class="p">,</span> <span class="s2">"subroutines"</span><span class="p">,</span> <span class="p">{})</span><span class="o">.</span><span class="n">values</span><span class="p">():</span>
- <span class="n">model_args</span> <span class="o">=</span> <span class="n">subroutine</span><span class="o">.</span><span class="n">model</span>
- <span class="nb">object</span><span class="o">.</span><span class="fm">__setattr__</span><span class="p">(</span>
- <span class="n">model_args</span><span class="p">,</span>
- <span class="s2">"per_instance_cost_limit"</span><span class="p">,</span>
- <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">per_instance_cost_limit</span><span class="p">,</span>
- <span class="p">)</span>
- <span class="nb">object</span><span class="o">.</span><span class="fm">__setattr__</span><span class="p">(</span><span class="n">model_args</span><span class="p">,</span> <span class="s2">"total_cost_limit"</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">model</span><span class="o">.</span><span class="n">total_cost_limit</span><span class="p">)</span>
- </code></pre></div></td></tr></table></div>
- </details>
- <div class="doc doc-children">
- </div>
- </div>
- </div>
- <div class="doc doc-object doc-class">
- <h2 id="sweagent.agent.agents.AgentHook" class="doc doc-heading">
- <code>AgentHook</code>
- </h2>
- <div class="doc doc-contents ">
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">217</span>
- <span class="normal">218</span>
- <span class="normal">219</span>
- <span class="normal">220</span>
- <span class="normal">221</span>
- <span class="normal">222</span>
- <span class="normal">223</span>
- <span class="normal">224</span>
- <span class="normal">225</span>
- <span class="normal">226</span>
- <span class="normal">227</span>
- <span class="normal">228</span>
- <span class="normal">229</span>
- <span class="normal">230</span>
- <span class="normal">231</span>
- <span class="normal">232</span>
- <span class="normal">233</span>
- <span class="normal">234</span>
- <span class="normal">235</span>
- <span class="normal">236</span>
- <span class="normal">237</span>
- <span class="normal">238</span>
- <span class="normal">239</span>
- <span class="normal">240</span>
- <span class="normal">241</span>
- <span class="normal">242</span>
- <span class="normal">243</span>
- <span class="normal">244</span>
- <span class="normal">245</span>
- <span class="normal">246</span>
- <span class="normal">247</span>
- <span class="normal">248</span>
- <span class="normal">249</span>
- <span class="normal">250</span>
- <span class="normal">251</span>
- <span class="normal">252</span>
- <span class="normal">253</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">class</span> <span class="nc">AgentHook</span><span class="p">:</span>
- <span class="k">def</span> <span class="nf">on_init</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="o">*</span><span class="p">,</span> <span class="n">agent</span><span class="p">:</span> <span class="n">Agent</span><span class="p">):</span>
- <span class="w"> </span><span class="sd">"""Note: Depending on the internals of `Agent` should be done with care,</span>
- <span class="sd"> it's best to use this as little as possible.</span>
- <span class="sd"> """</span>
- <span class="k">def</span> <span class="nf">on_run_start</span><span class="p">(</span>
- <span class="bp">self</span><span class="p">,</span>
- <span class="p">):</span> <span class="o">...</span>
- <span class="k">def</span> <span class="nf">on_step_start</span><span class="p">(</span><span class="bp">self</span><span class="p">):</span> <span class="o">...</span>
- <span class="k">def</span> <span class="nf">on_actions_generated</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="o">*</span><span class="p">,</span> <span class="n">thought</span><span class="p">:</span> <span class="nb">str</span><span class="p">,</span> <span class="n">action</span><span class="p">:</span> <span class="nb">str</span><span class="p">,</span> <span class="n">output</span><span class="p">:</span> <span class="nb">str</span><span class="p">):</span> <span class="o">...</span>
- <span class="k">def</span> <span class="nf">on_sub_action_started</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="o">*</span><span class="p">,</span> <span class="n">sub_action</span><span class="p">:</span> <span class="nb">str</span><span class="p">):</span> <span class="o">...</span>
- <span class="k">def</span> <span class="nf">on_sub_action_executed</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="o">*</span><span class="p">,</span> <span class="n">obs</span><span class="p">:</span> <span class="nb">str</span><span class="p">,</span> <span class="n">done</span><span class="p">:</span> <span class="nb">bool</span><span class="p">):</span> <span class="o">...</span>
- <span class="k">def</span> <span class="nf">on_step_done</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="o">*</span><span class="p">,</span> <span class="n">trajectory_step</span><span class="p">:</span> <span class="n">TrajectoryStep</span><span class="p">,</span> <span class="n">model_stats</span><span class="p">:</span> <span class="n">APIStats</span><span class="p">):</span> <span class="o">...</span>
- <span class="k">def</span> <span class="nf">on_run_done</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="o">*</span><span class="p">,</span> <span class="n">trajectory</span><span class="p">:</span> <span class="n">Trajectory</span><span class="p">,</span> <span class="n">info</span><span class="p">:</span> <span class="n">AgentInfo</span><span class="p">):</span> <span class="o">...</span>
- <span class="k">def</span> <span class="nf">on_model_query</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="o">*</span><span class="p">,</span> <span class="n">query</span><span class="p">:</span> <span class="nb">str</span><span class="p">,</span> <span class="n">agent</span><span class="p">:</span> <span class="nb">str</span><span class="p">):</span>
- <span class="w"> </span><span class="sd">"""Actually query the model with the complete history."""</span>
- <span class="k">def</span> <span class="nf">on_query_message_added</span><span class="p">(</span>
- <span class="bp">self</span><span class="p">,</span>
- <span class="o">*</span><span class="p">,</span>
- <span class="n">role</span><span class="p">:</span> <span class="nb">str</span><span class="p">,</span>
- <span class="n">content</span><span class="p">:</span> <span class="nb">str</span><span class="p">,</span>
- <span class="n">agent</span><span class="p">:</span> <span class="nb">str</span><span class="p">,</span>
- <span class="n">is_demo</span><span class="p">:</span> <span class="nb">bool</span> <span class="o">=</span> <span class="kc">False</span><span class="p">,</span>
- <span class="n">thought</span><span class="p">:</span> <span class="nb">str</span> <span class="o">=</span> <span class="s2">""</span><span class="p">,</span>
- <span class="n">action</span><span class="p">:</span> <span class="nb">str</span> <span class="o">=</span> <span class="s2">""</span><span class="p">,</span>
- <span class="p">):</span> <span class="o">...</span>
- <span class="k">def</span> <span class="nf">on_setup_done</span><span class="p">(</span><span class="bp">self</span><span class="p">):</span> <span class="o">...</span>
- </code></pre></div></td></tr></table></div>
- </details>
- <div class="doc doc-children">
- <div class="doc doc-object doc-function">
- <h3 id="sweagent.agent.agents.AgentHook.on_init" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">on_init</span><span class="p">(</span><span class="o">*</span><span class="p">,</span> <span class="n">agent</span><span class="p">)</span></code>
- </h3>
- <div class="doc doc-contents ">
- <p>Note: Depending on the internals of <code>Agent</code> should be done with care,
- it's best to use this as little as possible.</p>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">218</span>
- <span class="normal">219</span>
- <span class="normal">220</span>
- <span class="normal">221</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">def</span> <span class="nf">on_init</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="o">*</span><span class="p">,</span> <span class="n">agent</span><span class="p">:</span> <span class="n">Agent</span><span class="p">):</span>
- <span class="w"> </span><span class="sd">"""Note: Depending on the internals of `Agent` should be done with care,</span>
- <span class="sd"> it's best to use this as little as possible.</span>
- <span class="sd"> """</span>
- </code></pre></div></td></tr></table></div>
- </details>
- </div>
- </div>
- <div class="doc doc-object doc-function">
- <h3 id="sweagent.agent.agents.AgentHook.on_model_query" class="doc doc-heading">
- <code class="highlight language-python"><span class="n">on_model_query</span><span class="p">(</span><span class="o">*</span><span class="p">,</span> <span class="n">query</span><span class="p">,</span> <span class="n">agent</span><span class="p">)</span></code>
- </h3>
- <div class="doc doc-contents ">
- <p>Actually query the model with the complete history.</p>
- <details class="quote">
- <summary>Source code in <code>sweagent/agent/agents.py</code></summary>
- <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">239</span>
- <span class="normal">240</span></pre></div></td><td class="code"><div><pre><span></span><code><span class="k">def</span> <span class="nf">on_model_query</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="o">*</span><span class="p">,</span> <span class="n">query</span><span class="p">:</span> <span class="nb">str</span><span class="p">,</span> <span class="n">agent</span><span class="p">:</span> <span class="nb">str</span><span class="p">):</span>
- <span class="w"> </span><span class="sd">"""Actually query the model with the complete history."""</span>
- </code></pre></div></td></tr></table></div>
- </details>
- </div>
- </div>
- </div>
- </div>
- </div>
- </div>
- </div>
- </div>
-
- </article>
- </div>
-
-
- <script>var target=document.getElementById(location.hash.slice(1));target&&target.name&&(target.checked=target.name.startsWith("__tabbed_"))</script>
- </div>
-
- </main>
-
- <footer class="md-footer">
-
-
-
- <nav class="md-footer__inner md-grid" aria-label="Footer" >
-
-
- <a href="../" class="md-footer__link md-footer__link--prev" aria-label="Previous: Code structure and reference">
- <div class="md-footer__button md-icon">
-
- <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M20 11v2H8l5.5 5.5-1.42 1.42L4.16 12l7.92-7.92L13.5 5.5 8 11z"/></svg>
- </div>
- <div class="md-footer__title">
- <span class="md-footer__direction">
- Previous
- </span>
- <div class="md-ellipsis">
- Code structure and reference
- </div>
- </div>
- </a>
-
-
-
- <a href="../models/" class="md-footer__link md-footer__link--next" aria-label="Next: Models">
- <div class="md-footer__title">
- <span class="md-footer__direction">
- Next
- </span>
- <div class="md-ellipsis">
- Models
- </div>
- </div>
- <div class="md-footer__button md-icon">
-
- <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M4 11v2h12l-5.5 5.5 1.42 1.42L19.84 12l-7.92-7.92L10.5 5.5 16 11z"/></svg>
- </div>
- </a>
-
- </nav>
-
-
- <div class="md-footer-meta md-typeset">
- <div class="md-footer-meta__inner md-grid">
- <div class="md-copyright">
-
-
- Made with
- <a href="https://squidfunk.github.io/mkdocs-material/" target="_blank" rel="noopener">
- Material for MkDocs
- </a>
-
- </div>
-
- </div>
- </div>
- </footer>
-
- </div>
- <div class="md-dialog" data-md-component="dialog">
- <div class="md-dialog__inner md-typeset"></div>
- </div>
-
-
- <script id="__config" type="application/json">{"base": "../..", "features": ["navigation.indexes", "content.action.edit", "navigation.footer", "content.code.copy", "content.footnote.tooltips", "header.autohide", "announce.dismiss"], "search": "../../assets/javascripts/workers/search.6ce7567c.min.js", "translations": {"clipboard.copied": "Copied to clipboard", "clipboard.copy": "Copy to clipboard", "search.result.more.one": "1 more on this page", "search.result.more.other": "# more on this page", "search.result.none": "No matching documents", "search.result.one": "1 matching document", "search.result.other": "# matching documents", "search.result.placeholder": "Type to start searching", "search.result.term.missing": "Missing", "select.version": "Select version"}}</script>
-
-
- <script src="../../assets/javascripts/bundle.525ec568.min.js"></script>
-
-
- <script id="init-glightbox">const lightbox = GLightbox({"touchNavigation": true, "loop": false, "zoomable": true, "draggable": true, "openEffect": "zoom", "closeEffect": "zoom", "slideEffect": "slide"});
- document$.subscribe(() => { lightbox.reload() });
- </script></body>
- </html>
|