agbenchmark/README.md,sha256=D1lbbIgcFxpJ6bXCO9-vTLTWMKArtWB5uS_Ii4Kd7LI,2780
agbenchmark/ReportManager.py,sha256=PyOzUP11zXMrow-Wcx_Vl2KzJ1vvXgyKt_zNZDlA7Yw,2336
agbenchmark/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
agbenchmark/agent_interface.py,sha256=sgY3dw6Ux94ziYOUSFw6VvF99yypvZm6F7x_Yd41FB0,2530
agbenchmark/challenge.py,sha256=KMp5WQGZrKsIcINpFZa7CaF-wyqhS7eReKSM_HBrSZs,5140
agbenchmark/challenges/README.md,sha256=FTTMVGOsO2nI4IZtsXE9pOrPBnp3m_FSFE9c5ylUF_c,2581
agbenchmark/challenges/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
agbenchmark/challenges/code/d1_debug/artifacts_in/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
agbenchmark/challenges/code/d1_debug/artifacts_in/code.py,sha256=Y2yG7-fob5yIBNp1x5mlzbAXlrSYKT_B1oerkPZAvwI,325
agbenchmark/challenges/code/d1_debug/artifacts_in/test.py,sha256=1U0zbxA2LNEuVHsBnuMeW2-wbYifcG9-bjjpvaNp-vY,893
agbenchmark/challenges/code/d1_debug/artifacts_out/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
agbenchmark/challenges/code/d1_debug/artifacts_out/code.py,sha256=mgEL1hA8gPm3ABq_RhVC8_dSDW-DlVYYTAOpERlKk0g,312
agbenchmark/challenges/code/d1_debug/artifacts_out/test.py,sha256=1U0zbxA2LNEuVHsBnuMeW2-wbYifcG9-bjjpvaNp-vY,893
agbenchmark/challenges/code/d1_debug/data.json,sha256=u8E-VQXKvIbpGzJ8JiNalh7_Y_3l44pW_Q91by0wlP4,645
agbenchmark/challenges/code/d2_vague/artifacts_in/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
agbenchmark/challenges/code/d2_vague/artifacts_in/code.py,sha256=Y2yG7-fob5yIBNp1x5mlzbAXlrSYKT_B1oerkPZAvwI,325
agbenchmark/challenges/code/d2_vague/artifacts_in/test.py,sha256=1U0zbxA2LNEuVHsBnuMeW2-wbYifcG9-bjjpvaNp-vY,893
agbenchmark/challenges/code/d2_vague/artifacts_out/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
agbenchmark/challenges/code/d2_vague/artifacts_out/code.py,sha256=mgEL1hA8gPm3ABq_RhVC8_dSDW-DlVYYTAOpERlKk0g,312
agbenchmark/challenges/code/d2_vague/artifacts_out/test.py,sha256=1U0zbxA2LNEuVHsBnuMeW2-wbYifcG9-bjjpvaNp-vY,893
agbenchmark/challenges/code/d2_vague/data.json,sha256=ZfktefY7jUN4bUfyTEIrnPx-rnrbdPIISqQNzjQcptQ,612
agbenchmark/challenges/code/d3_two_sum/artifacts_out/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
agbenchmark/challenges/code/d3_two_sum/artifacts_out/code.py,sha256=mgEL1hA8gPm3ABq_RhVC8_dSDW-DlVYYTAOpERlKk0g,312
agbenchmark/challenges/code/d3_two_sum/custom_python/test.py,sha256=1U0zbxA2LNEuVHsBnuMeW2-wbYifcG9-bjjpvaNp-vY,893
agbenchmark/challenges/code/d3_two_sum/data.json,sha256=bN7B1-_GtN7ZOKH16bjkGK60JkPqsonWSpQHMzEG284,869
agbenchmark/challenges/code/d4_web_server/custom_python/api_tests.py,sha256=iMQrUa1oYE-vr_EbeTk_nLKjPZ9POYF1jNT7F1AbUqk,1171
agbenchmark/challenges/code/d4_web_server/data.json,sha256=kJ05dwV3wyOsXxEE0am4decRuF8R-eO6ukBY2LPjkdI,757
agbenchmark/challenges/code/d5_three_sum/artifacts_out/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
agbenchmark/challenges/code/d5_three_sum/artifacts_out/code.py,sha256=7WIWYXHzGB6358P__XvOeOxK83GeOMapGL1FG-1ikaU,809
agbenchmark/challenges/code/d5_three_sum/custom_python/test.py,sha256=gbT4bj6oVNiQBkhVYaxWr2dNJtRW39Y4GHNeUbt4pSM,921
agbenchmark/challenges/code/d5_three_sum/data.json,sha256=Ffqjd9l4PEoRlZi9BDKhFithTUZqt97kyZF5TE--Bpk,933
agbenchmark/challenges/define_task_types.py,sha256=kYdg4Z6fRW1WiD5NYsqYF2KnSs6hNQGPg3WRhi0cke0,2076
agbenchmark/challenges/interface/read_file/artifacts_in/file_to_check.txt,sha256=A7ogTlDRJuRnTABeBNguhMITZngK8fQ71Uo3gWtqs0A,13
agbenchmark/challenges/interface/read_file/artifacts_out/file_to_check.txt,sha256=Qmpa2TwVaYN6Zk-7DIg6ZUt6knls324ht3AL-Cge-IU,27
agbenchmark/challenges/interface/read_file/data.json,sha256=Ue0dhxj8LjaIBAb1CQouZsAGyw9-8VPwl74VDBi1x2U,517
agbenchmark/challenges/interface/search/artifacts_out/random_file.txt,sha256=GC3T1SMUqdw8VUrUFJA7B-x2U9ltyOFsYA1VSprESLg,38
agbenchmark/challenges/interface/search/data.json,sha256=jDC9vuDLazZGY-b6P9jKoGmCtjba4Xgl4EL5E3racNw,547
agbenchmark/challenges/interface/write_file/artifacts_out/random_file.txt,sha256=XfgOVJWOZ1Fyv7_tBMuTjmo0egi8UJj7hKocXjoVNSE,11
agbenchmark/challenges/interface/write_file/data.json,sha256=UAEmcKCCJsvGQf0y5GVaiPqihnzL2riBOpzKKSBHtVw,519
agbenchmark/challenges/memory/m1_id/artifacts_in/instructions_1.txt,sha256=KbEhoojak7uF5aL256sewRK_V_ln42ACQfasZV7V8ks,60
agbenchmark/challenges/memory/m1_id/artifacts_in/instructions_2.txt,sha256=PJRIJGe4xbPXTYVMocv1i2T5eCaQRbkdNLgG9m5H720,33
agbenchmark/challenges/memory/m1_id/artifacts_in/instructions_3.txt,sha256=hykrjTjIqNLoCI6wEyDBXuFyquiQtDe5X6rI5RBPBho,33
agbenchmark/challenges/memory/m1_id/artifacts_in/instructions_4.txt,sha256=SLVu3D2Z0HDTgss4p9Th933ihTYLRLOz_c1E2Lk7d8w,33
agbenchmark/challenges/memory/m1_id/artifacts_in/instructions_5.txt,sha256=xZPF8_zMPalLDAc2dln4oT2J9_t8KlnpqttiM7VLkA0,63
agbenchmark/challenges/memory/m1_id/artifacts_out/result.txt,sha256=5DhCthi52lMSFHo7-G59vr9AukCpFH4zZHvR380AVrc,5
agbenchmark/challenges/memory/m1_id/data.json,sha256=ZQ6KU8foB9LVl9ni3grkFh-AjJKvj39T7uTHgE2n5Dk,598
agbenchmark/challenges/memory/m2_multiple/artifacts_in/instructions_1.txt,sha256=rJREbJdY6-w_XM1EAUL3JVqG3KoNbjK6eOvGRMOb5Eo,62
agbenchmark/challenges/memory/m2_multiple/artifacts_in/instructions_2.txt,sha256=cMJFo1SFDdzKJtpNhW7wztH8ncqdP8xtBgKAlYLyP-Q,62
agbenchmark/challenges/memory/m2_multiple/artifacts_in/instructions_3.txt,sha256=EvkPdHm4JaSsyZ4id9Jgn5m0s8nIOZa96KZo1a2M22g,62
agbenchmark/challenges/memory/m2_multiple/artifacts_in/instructions_4.txt,sha256=eF5Fra1cFOFRa9pSuub9U-dC2SuyKZVrkohAerkRvfg,62
agbenchmark/challenges/memory/m2_multiple/artifacts_in/instructions_5.txt,sha256=4dk-YYBCUMHBva4GZxUd8lkbg3JlGUUw6N8FPFPvQRM,64
agbenchmark/challenges/memory/m2_multiple/artifacts_out/result.txt,sha256=8AyRpnUxGE9YsHwLonUEcX4M8xIl1dGOzKqtD_Fey-0,20
agbenchmark/challenges/memory/m2_multiple/data.json,sha256=FoYwrWmR0FEvgge-1LkLF-mZTcwfoLlgQw5CZ2oM0kI,667
agbenchmark/challenges/memory/m3_noise/artifacts_in/instructions_1.txt,sha256=bsHwHIS3gS6zIe7QMZFoYImIrWtnfEnYz6DwH2wtBYM,1066
agbenchmark/challenges/memory/m3_noise/artifacts_in/instructions_2.txt,sha256=98u6vRuPLTl1R6Y47rqoeBjhl3TeOPl8wnBPduDLb0Y,1066
agbenchmark/challenges/memory/m3_noise/artifacts_in/instructions_3.txt,sha256=Bc6tYrP6_p0q7SkwYmL5xiY1ZDfVLRt0GEEh6EQyT9U,1066
agbenchmark/challenges/memory/m3_noise/artifacts_in/instructions_4.txt,sha256=_7_ZsUpJBijRo8nO8ASdwfRbpWXh58rCZH1baz93wDw,1066
agbenchmark/challenges/memory/m3_noise/artifacts_in/instructions_5.txt,sha256=x0cO-tlHqFssNeOfvYcUg3GqQJcal2seUNOjFCFMHUc,1068
agbenchmark/challenges/memory/m3_noise/artifacts_out/result.txt,sha256=8AyRpnUxGE9YsHwLonUEcX4M8xIl1dGOzKqtD_Fey-0,20
agbenchmark/challenges/memory/m3_noise/data.json,sha256=pdoPlLjjhxovqryKv2OsQJ3rAWazJ_ZYrffU4e6OhZU,774
agbenchmark/challenges/memory/m4_phrases/artifacts_in/instructions_1.txt,sha256=ado2S-u85HWt2uOKZZnsawLcU1gZJ8qOTq9BKd5GGmc,1127
agbenchmark/challenges/memory/m4_phrases/artifacts_in/instructions_2.txt,sha256=WpyCDMvWkqtSIRWGfjDguPAA--hIiRsTPqrFaH_86nA,1124
agbenchmark/challenges/memory/m4_phrases/artifacts_in/instructions_3.txt,sha256=uZ2lMnS8Xs0Q-Ay534hgz4TUi2pCcmho50k6m5SxX2U,1117
agbenchmark/challenges/memory/m4_phrases/artifacts_in/instructions_4.txt,sha256=vKMkA0e8_vpe8w-SjI47zgDTp68IR2XGgy9nxARfd14,1126
agbenchmark/challenges/memory/m4_phrases/artifacts_in/instructions_5.txt,sha256=LPLLI6E_foe0y88HdcomK48ICjHjp85l6IJ2GAu6wVI,1072
agbenchmark/challenges/memory/m4_phrases/artifacts_out/result.txt,sha256=a8gcVHiMXE-42Scrp0yfoyQPHFAANHCqsL8tUKH6G4o,226
agbenchmark/challenges/memory/m4_phrases/data.json,sha256=Uw25gD87i31BmtjQFyx4qlqrcEruGBAvpmZ56KF64U4,1234
agbenchmark/challenges/retrieval/r1_book_price/artifacts_out/random_file.txt,sha256=S-0qJWMjiFn6wz6BMchWL3g50XMaWxsn-sUEBGQ0wlk,6
agbenchmark/challenges/retrieval/r1_book_price/data.json,sha256=Q5X3giXuVnZmoeZ3pJ7Z51TMpI48YXlgSSDIAadnD4g,555
agbenchmark/challenges/retrieval/r2.1_specific/artifacts_out/random_file.txt,sha256=iVQEyv_aA8zqwHzTXUTAQDOhic8Ha_Teudju2BOSoaU,16
agbenchmark/challenges/retrieval/r2.1_specific/data.json,sha256=pLaGU9SD4Rtt6gM-J7kO5KcWTgXXNrNfUkKS-_I50us,510
agbenchmark/challenges/retrieval/r2.2_formatting/artifacts_out/random_file.txt,sha256=iVQEyv_aA8zqwHzTXUTAQDOhic8Ha_Teudju2BOSoaU,16
agbenchmark/challenges/retrieval/r2.2_formatting/data.json,sha256=pS0jn0OQxod5s3FMQ1Tq97cMMB0CfvoNoMVOV3Nv5W8,678
agbenchmark/challenges/retrieval/r2_tesla_revenue/artifacts_out/random_file.txt,sha256=iVQEyv_aA8zqwHzTXUTAQDOhic8Ha_Teudju2BOSoaU,16
agbenchmark/challenges/retrieval/r2_tesla_revenue/data.json,sha256=wN-wQV1-NPUDsC-u7tRxjzdk0tVWiCmQD24bVtrOefU,473
agbenchmark/challenges/retrieval/r3/artifacts_out/random_file.txt,sha256=tSSkDboMTOBZNwaru9dJ1RDkIAMVG5H62fcwtkZQE-Q,220
agbenchmark/challenges/retrieval/r3/data.json,sha256=StFsnKlWz_cv4r2lBCTHmgLE9sBWYs8eQJ4VeKAGeiQ,1079
agbenchmark/challenges/test_all.py,sha256=sZV5v4L69mZiz6bfxdduR6SQHQwguGIQzRh1f2y3tvM,2317
agbenchmark/config.json,sha256=pkLpkq2447fyLM7iQaiHqGl1rlMZCEE2OQxWCKohjKE,61
agbenchmark/conftest.py,sha256=Zf_NxowMOELON0HBSj-sphRu1QaIMaJwvxbDqE30hto,9449
agbenchmark/metrics.py,sha256=Kslgd-61TNLa6qwK9Q8rkfI-rjhRa-ffQ9wFNBJXFHw,466
agbenchmark/regression_tests.json,sha256=o79hOPK8X0TCQVxmIFK1PHIu2o9SRZI-gHaaqeRJaPQ,1841
agbenchmark/reports/internal_info.json,sha256=KsLWhjyHqYp8Ltv5lsLTcckrYm1Qu614QembWuOtI7I,2706
agbenchmark/reports/mini-agi/1.1_TestWriteFile.json,sha256=c4D31d9x6s5rvx_ExGU5kTcTseME09Eb9QY2gXlwruo,648
agbenchmark/reports/mini-agi/10.1_TestRememberMultipleWithNoise.json,sha256=FH7MSMByQf_s8oA0STUZfCkrGpdW3GsbGeKAeZIBgPA,1086
agbenchmark/reports/mini-agi/10_TestRememberMultipleWithNoise.json,sha256=HOtSEwpAQM_nTu3IXeRAfZdBubprxT0lW2qpUaybz_U,1200
agbenchmark/reports/mini-agi/11.1_TestRememberMultiplePhrasesWithNoise.json,sha256=ERqxXbAzf-gK-805FQHZlHW8-4R2zJ1xDL5fS58aNPM,1444
agbenchmark/reports/mini-agi/11.2_TestRememberMultiplePhrasesWithNoise.json,sha256=pWTz_MuHeqxxO9ABb94-QEeQepfB2Z3Lyqus99c9ij4,1444
agbenchmark/reports/mini-agi/11.3_TestRememberMultiplePhrasesWithNoise.json,sha256=hYNr4oCtXFCafzLgrhsdaOkdJH97l4kgCVyAx3iWOmU,1444
agbenchmark/reports/mini-agi/11.4_TestRememberMultiplePhrasesWithNoise.json,sha256=y4Mk80bC6ly624ffQJkP8nKmIdmc2PzZNy_KPGeX8YA,1377
agbenchmark/reports/mini-agi/11.5_TestRememberMultiplePhrasesWithNoise.json,sha256=rQoHCBuwPiofAQn0-wUbl_ifdUSn25Bq4zHKNAqeC8E,1446
agbenchmark/reports/mini-agi/11_TestRememberMultiplePhrasesWithNoise.json,sha256=gyQ1QfJ8X6j_W4GcsYls5ydMj1ZShoVinVOdIF0dQDg,1444
agbenchmark/reports/mini-agi/12.1_TestDebugSimpleTypoWithGuidance.json,sha256=jhSa_xPOhLrmkq6tvwGvV4AFvUfypf9WmvJ2ry4Ggs8,1059
agbenchmark/reports/mini-agi/12.2_TestDebugSimpleTypoWithGuidance.json,sha256=jhTKVSgdClpgNMC04QkK9K9P094iyXs-hzlQMTC_4Nc,1060
agbenchmark/reports/mini-agi/12.3_TestDebugSimpleTypoWithGuidance.json,sha256=xIX3czSn59eU5RDA6fl-dnZPqnwVeDauM9QxLj47ugg,1066
agbenchmark/reports/mini-agi/12_TestDebugSimpleTypoWithGuidance.json,sha256=x_JfYKEhNa3Aaf6Ny9fS8pREseqMYDvsBoFKoDZ0I7U,980
agbenchmark/reports/mini-agi/1_TestWriteFIle.json,sha256=I_A_8dR_z9wCv_nXNp-1HGTxnyJjt69_R1amHG3cw0o,639
agbenchmark/reports/mini-agi/2.1_TestReadFile.json,sha256=PPU0De8x7e2Y9rB7i6v9JPz6bvCgvVVLRURnPUX0ucc,644
agbenchmark/reports/mini-agi/2_TestReadFile.json,sha256=EAquj8A5wbn8eH0MmVAEUZ9XrOC6eoPg36gIX9_0PnI,636
agbenchmark/reports/mini-agi/3.1_TestSearch.json,sha256=9i_2-qTGBCMgIGFJtvI96oI68kn3XTlVosPwNsr1ng8,638
agbenchmark/reports/mini-agi/3_TestSearch.json,sha256=6-lacMIp8DcVaVWPR8AaFyYlAcpkTKHxoPLYARQ7YUE,630
agbenchmark/reports/mini-agi/4.1_TestBasicRetrieval.json,sha256=6L86S2l2fHHM80ggYqm3Dvt0ABZtOdHOw2y2lrLPOsA,634
agbenchmark/reports/mini-agi/4_TestBasicRetrieval.json,sha256=ThmvvuY3UtkepB65b3J8F4WiXAqHjsJ6qtGycuH00Vw,641
agbenchmark/reports/mini-agi/5.1_TestRetrieval2.0.json,sha256=RUtu7VDKqZi3qJYdURiIaPV2wwCxT78KDgclzQRYM5Y,814
agbenchmark/reports/mini-agi/5_TestRetrieval2.0.json,sha256=gE2yW2SZvIICJzu81Kfqlw_R__RNqY4AOthY-Gcmmp0,753
agbenchmark/reports/mini-agi/6.1_TestRetrieval2.1.json,sha256=N4OmFRRkZqVvz5xrZi19IIz2D1JTuHpv_ps2Ive-L6I,841
agbenchmark/reports/mini-agi/6.2_TestRetrieval2.1.json,sha256=27AuiKsU-6y0rQmhw5pMBZQQPWdCltFQ90wTE4-tRFk,836
agbenchmark/reports/mini-agi/6.3_TestRetrieval2.1.json,sha256=Cm_mGX67dMLKbsichb647EYIcpE8s8HcbGSh_H3KUSY,836
agbenchmark/reports/mini-agi/6.4_TestRetrieval2.1.json,sha256=P9fAHvoxmF9UpKDnfLZ1lTg_YBLpYkSxObIo6qmLv7E,908
agbenchmark/reports/mini-agi/6_TestRetrieval2.1.json,sha256=zUmuNGzB7AZfEMqEFbnHolgfsNQuviG-mfjCqQr9okc,823
agbenchmark/reports/mini-agi/7.1_TestRetrieval2.2.json,sha256=BaJEUdbc5i0tz7j1_P1DIEk29u4tOvlM89sBnvAOcAI,1073
agbenchmark/reports/mini-agi/7_TestRetrieval2.2.json,sha256=zeFZP4JfXkj-SA3r4LgEH8SDTLTQMRzrTZdpzG-BQ-8,893
agbenchmark/reports/mini-agi/8.1_TestBasicMemory.json,sha256=AcmRu3BnE2NVYV2GmdPZTVDykXrc9F3rVQ5OLhf7kmw,908
agbenchmark/reports/mini-agi/8_TestBasicMemory.json,sha256=yDolZEfLuxF3l3FDPDirIkDbNA47Fcb1ZQ7dPN6B1VQ,1041
agbenchmark/reports/mini-agi/9.1_TestRememberMultipleIds.json,sha256=8EP5S-DMjo3xcMHs8gU9RuWOPuaNbA4SFREY7kzEnzM,982
agbenchmark/reports/mini-agi/9_TestRememberMultipleIds.json,sha256=FEo0G1nSgQ7tY79zhNtjRpr1Tcg9NvTdaer6JHgBt3U,1110
agbenchmark/start_benchmark.py,sha256=qKu_UmxLyz__r0ZkYutRrtuo7HLKzhD7ijr1NrnLnOg,3843
agbenchmark/utils.py,sha256=FozYtMV3paiTU_mhUz73jIg68SEP_By2r-F8rNrdAwI,6977
agbenchmark-0.0.1.dist-info/LICENSE,sha256=eeSqmvfdcXlIITNOsv-_AiuDrUzhxG-dIzCtgn8OzZI,1069
agbenchmark-0.0.1.dist-info/METADATA,sha256=XG-9N7HreTRMNVpXkhjpbuDKoRAs8zoa_mA8I_BESdc,2693
agbenchmark-0.0.1.dist-info/WHEEL,sha256=Zb28QaM1gQi8f4VCBhsUklF61CTlNYfs9YAZn-TOGFk,88
agbenchmark-0.0.1.dist-info/entry_points.txt,sha256=TrDUWFh9sn6-hqU5ENcL53OCPLDg8h9b0G4VxWl0HF0,63
agbenchmark-0.0.1.dist-info/RECORD,,
