AgentArgs
AgentArgs.set_benchmark()
AgentArgs.set_reproducibility_mode()
AXTree
ActionFlags
ActionFlags.action_set
ActionFlags.individual_examples
ActionFlags.is_strict
ActionFlags.long_description
ActionFlags.multi_actions
ActionPrompt
BeCautious
ChatInstructions
Error
Flags
Flags.asdict()
Flags.copy()
Flags.from_dict()
FocusedElement
GoalInstructions
HTML
Hints
History
History.shrink()
HistoryStep
HistoryStep.shrink()
MacNote
ObsFlags
ObsFlags.use_html
ObsFlags.use_ax_tree
ObsFlags.use_focused_element
ObsFlags.use_error_logs
ObsFlags.use_history
ObsFlags.use_past_error_logs
ObsFlags.use_action_history
ObsFlags.use_think_history
ObsFlags.use_diff
ObsFlags.html_type
ObsFlags.use_screenshot
ObsFlags.use_som
ObsFlags.extract_visible_tag
ObsFlags.extract_clickable_tag
ObsFlags.extract_coords
ObsFlags.filter_visible_elements_only
ObsFlags.filter_som_only
ObsFlags.filter_with_bid_only
ObsFlags.openai_vision_detail
ObsFlags.use_tabs
Observation
Observation.add_screenshot()
Observation.shrink()
PromptElement
PromptElement.abstract_ex
PromptElement.concrete_ex
PromptElement.is_visible
PromptElement.parse_answer()
PromptElement.prompt
Shrinkable
Shrinkable.shrink()
SystemPrompt
Tabs
Think
Trunkater
Trunkater.shrink()
fit_tokens()
make_obs_preprocessor()
GenericAgent
GenericAgent.get_action()
GenericAgent.obs_preprocessor()
GenericAgent.reset()
GenericAgentArgs
GenericAgentArgs.chat_model_args
GenericAgentArgs.close()
GenericAgentArgs.flags
GenericAgentArgs.make_agent()
GenericAgentArgs.max_retry
GenericAgentArgs.prepare()
GenericAgentArgs.set_benchmark()
GenericAgentArgs.set_reproducibility_mode()
get_action_post_hoc()
Criticise
GenericPromptFlags
GenericPromptFlags.use_plan
GenericPromptFlags.use_criticise
GenericPromptFlags.use_thinking
GenericPromptFlags.use_concrete_example
GenericPromptFlags.use_abstract_example
GenericPromptFlags.use_hints
GenericPromptFlags.enable_chat
GenericPromptFlags.max_prompt_tokens
GenericPromptFlags.be_cautious
GenericPromptFlags.extra_instructions
GenericPromptFlags.add_missparsed_messages
GenericPromptFlags.flag_group
GenericPromptFlags.action
GenericPromptFlags.max_trunc_itr
GenericPromptFlags.obs
GenericPromptFlags.use_memory
MainPrompt
MainPrompt.shrink()
Memory
Plan
ReproAgent
ReproAgent.get_action()
ReproAgentArgs
ReproAgentArgs.make_agent()
ReproChatModel
ReproChatModel.get_stats()
make_repro_agent()
reproduce_study()
get_base_agent()
get_som_agent()
get_vision_agent()
MostBasicAgent
MostBasicAgent.get_action()
MostBasicAgentArgs
MostBasicAgentArgs.agent_name
MostBasicAgentArgs.chat_model_args
MostBasicAgentArgs.close()
MostBasicAgentArgs.make_agent()
MostBasicAgentArgs.prepare()
MostBasicAgentArgs.set_reproducibility_mode()
MostBasicAgentArgs.temperature
MostBasicAgentArgs.use_chain_of_thought
experiment_config()
VisualWebArenaAgent
VisualWebArenaAgent.get_action()
VisualWebArenaAgentArgs
VisualWebArenaAgentArgs.action_set_args
VisualWebArenaAgentArgs.agent_name
VisualWebArenaAgentArgs.chat_model_args
VisualWebArenaAgentArgs.close()
VisualWebArenaAgentArgs.make_agent()
VisualWebArenaAgentArgs.observation_type
VisualWebArenaAgentArgs.prepare()
VisualWebArenaAgentArgs.set_benchmark()
VisualWebArenaAgentArgs.set_reproducibility_mode()
VisualWebArenaAgentArgs.temperature
VisualWebArenaAgentArgs.with_few_shot_examples
image_data_to_uri()
parser()
ClickMapper
ClickMapper.to_step()
ClickMapper.to_time()
EpisodeId
EpisodeId.agent_id
EpisodeId.seed
EpisodeId.task_name
Info
Info.active_tab
Info.agent_df
Info.agent_id_keys
Info.click_mapper
Info.exp_list_dir
Info.exp_result
Info.filter_agent_id()
Info.get_agent_id()
Info.result_df
Info.results_dir
Info.step
Info.tasks_df
Info.update_exp_result()
StepId
StepId.episode_id
StepId.step
add_patch()
clean_column_names()
code()
display_table()
fig_to_pil()
format_constant_and_variables()
gallery_step_change()
generate_profiling()
get_action_info()
get_agent_report()
get_directory_contents()
get_episode_info()
get_obs()
get_screenshot()
get_seeds_df()
get_state_error()
if_active()
main()
most_recent_folder()
new_agent_id()
new_episode()
new_exp_dir()
on_select_agent()
on_select_seed()
on_select_task()
plot_profiling()
refresh_exp_dir_choices()
remove_args_from_col()
run_gradio()
select_step()
submit_action()
tab_select()
update_agent_info_html()
update_agent_info_md()
update_axtree()
update_chat_messages()
update_error_report()
update_global_stats()
update_html()
update_logs()
update_prompt_tests()
update_pruned_html()
update_screenshot()
update_screenshot_gallery()
update_screenshot_pair()
update_seeds()
update_stats()
update_step_info()
update_task_error()
ablation_report()
categorize_error()
display_report()
error_report()
error_report_detailed()
flag_report()
get_all_summaries()
get_all_task_messages()
get_constants_and_variables()
get_sample_std_err()
get_std_err()
get_study_summary()
global_report()
load_result_df()
map_err_key()
print_errors_chronologically()
reduce_episodes()
report_2d()
report_constant_and_variables()
report_different_errors()
set_index_from_variables()
set_wrap_style()
shrink_columns()
split_by_key()
summarize()
summarize_stats()
summarize_study()
AbstractChatModel
AbstractChatModel.get_stats()
BaseModelArgs
BaseModelArgs.close_server()
BaseModelArgs.make_model()
BaseModelArgs.max_input_tokens
BaseModelArgs.max_new_tokens
BaseModelArgs.max_total_tokens
BaseModelArgs.model_name
BaseModelArgs.prepare_server()
BaseModelArgs.temperature
BaseModelArgs.vision_support
AzureChatModel
AzureModelArgs
AzureModelArgs.deployment_name
AzureModelArgs.make_model()
ChatModel
ChatModel.get_stats()
ChatModelArgs
ChatModelArgs.extra_tgi_args
ChatModelArgs.hf_hosted
ChatModelArgs.infer_tokens_length
ChatModelArgs.info
ChatModelArgs.is_model_operational
ChatModelArgs.make_model()
ChatModelArgs.model_path
ChatModelArgs.model_size
ChatModelArgs.model_url
ChatModelArgs.n_retry_server
ChatModelArgs.shard_support
ChatModelArgs.sliding_window
ChatModelArgs.tgi_image
ChatModelArgs.training_total_tokens
ChatModelArgs.vision_support
CheatMiniWoBLLM
CheatMiniWoBLLMArgs
CheatMiniWoBLLMArgs.close_server()
CheatMiniWoBLLMArgs.make_model()
CheatMiniWoBLLMArgs.max_input_tokens
CheatMiniWoBLLMArgs.max_new_tokens
CheatMiniWoBLLMArgs.max_total_tokens
CheatMiniWoBLLMArgs.model_name
CheatMiniWoBLLMArgs.prepare_server()
CheatMiniWoBLLMArgs.wait_time
HuggingFaceURLChatModel
OpenAIChatModel
OpenAIModelArgs
OpenAIModelArgs.make_model()
OpenRouterChatModel
OpenRouterError
OpenRouterModelArgs
OpenRouterModelArgs.make_model()
RetryError
SelfHostedModelArgs
SelfHostedModelArgs.backend
SelfHostedModelArgs.make_model()
SelfHostedModelArgs.model_url
SelfHostedModelArgs.n_retry_server
SelfHostedModelArgs.token
handle_error()
make_assistant_message()
make_system_message()
make_user_message()
HFBaseChatModel
HFBaseChatModel.llm
HFBaseChatModel.prompt_template
HFBaseChatModel.tokenizer
HFBaseChatModel.n_retry_server
AIMessage
BaseMessage
BaseMessage.add_content()
BaseMessage.add_image()
BaseMessage.add_text()
BaseMessage.merge()
BaseMessage.to_markdown()
Discussion
Discussion.add_content()
Discussion.add_image()
Discussion.add_message()
Discussion.add_text()
Discussion.append()
Discussion.last_message
Discussion.merge()
Discussion.to_markdown()
Discussion.to_openai()
Discussion.to_string()
HumanMessage
ParseError
SystemMessage
compress_string()
count_tokens()
download_and_save_model()
extract_code_blocks()
extract_html_tags()
get_tokenizer()
get_tokenizer_old()
image_to_jpg_base64_url()
json_parser()
messages_to_dict()
parse_html_tags()
parse_html_tags_raise()
retry()
retry_multiple()
truncate_tokens()
yaml_parser()
PromptTemplate
PromptTemplate.ai
PromptTemplate.construct_prompt()
PromptTemplate.format_message()
PromptTemplate.human
PromptTemplate.prompt_end
PromptTemplate.system
get_prompt_template()
LLMTracker
LLMTracker.add_tracker()
LLMTracker.stats
cost_tracker_decorator()
get_pricing_openai()
get_pricing_openrouter()
set_tracker()
Choice
Choice.sample()
CrossProd
Distribution
Distribution.sample()
Toggle
expand_cross_product()
make_ablation_study()
make_progression_study()
sample_and_expand_cross_product()
sample_args()
MockedExpArgs
MockedExpArgs.run()
add_dependencies()
hide_some_exp()
make_seeds()
order()
run_exp()
timeout_manager()
execute_task_graph()
get_elapsed_time()
poll_for_timeout()
find_incomplete()
import_object()
non_dummy_count()
noop()
run_experiments()
BaseServer
BaseServer.init()
WebArenaInstanceVars
WebArenaInstanceVars.base_url
WebArenaInstanceVars.clone()
WebArenaInstanceVars.from_env_vars()
WebArenaInstanceVars.full_reset
WebArenaInstanceVars.gitlab
WebArenaInstanceVars.homepage
WebArenaInstanceVars.init()
WebArenaInstanceVars.make_env_vars()
WebArenaInstanceVars.map
WebArenaInstanceVars.module_name
WebArenaInstanceVars.prefix
WebArenaInstanceVars.reddit
WebArenaInstanceVars.shopping
WebArenaInstanceVars.shopping_admin
WebArenaInstanceVars.wikipedia
unimport_modules()
append_to_journal()
assert_compatible()
get_reproducibility_info()
AbstractStudy
AbstractStudy.dir
AbstractStudy.find_incomplete()
AbstractStudy.get_results()
AbstractStudy.make_dir()
AbstractStudy.run()
AbstractStudy.save()
AbstractStudy.shuffle_exps()
AbstractStudy.suffix
ParallelStudies
ParallelStudies.parallel_servers
ParallelStudies_alt
ParallelStudies_alt.parallel_servers
SequentialStudies
SequentialStudies.append_to_journal()
SequentialStudies.find_incomplete()
SequentialStudies.name
SequentialStudies.override_max_steps()
SequentialStudies.run()
SequentialStudies.studies
Study
Study.agent_args
Study.benchmark
Study.dir
Study.suffix
Study.uuid
Study.reproducibility_info
Study.logging_level
Study.logging_level_stdout
Study.comment
Study.ignore_dependencies
Study.avg_step_timeout
Study.demo_mode
Study.append_to_journal()
Study.find_incomplete()
Study.load()
Study.load_exp_args_list()
Study.load_most_recent()
Study.make_exp_args_list()
Study.name
Study.override_max_steps()
Study.run()
Study.set_reproducibility_info()
get_most_recent_study()
make_study()
set_demo_mode()
clean_dict()
compress_chains()
compress_sequential_chains()
dict_to_networkx()
plot_components_grid()
plot_graph()
make_exp_args()