@@ -68,16 +68,15 @@ python -u -m agentq
68
68
69
69
### generate DPO pairs for RL
70
70
71
- ```` bash
71
+ ``` bash
72
72
python -m agentq.core.mcts.browser_mcts
73
73
```
74
74
75
75
#### citations
76
76
77
77
a bunch of amazing work in the space has inspired this project.
78
78
79
- ````
80
-
79
+ ```
81
80
@misc{putta2024agentqadvancedreasoning,
82
81
title={Agent Q: Advanced Reasoning and Learning for Autonomous AI Agents},
83
82
author={Pranav Putta and Edmund Mills and Naman Garg and Sumeet Motwani and Chelsea Finn and Divyansh Garg and Rafael Rafailov},
@@ -87,8 +86,8 @@ archivePrefix={arXiv},
87
86
primaryClass={cs.AI},
88
87
url={https://arxiv.org/abs/2408.07199},
89
88
}
90
-
91
89
```
90
+
92
91
```
93
92
@inproceedings{yao2022webshop,
94
93
bibtex_show = {true},
@@ -102,18 +101,15 @@ url={https://arxiv.org/abs/2408.07199},
102
101
```
103
102
104
103
```
105
-
106
104
@article{he2024webvoyager,
107
105
title={WebVoyager: Building an End-to-End Web Agent with Large Multimodal Models},
108
106
author={He, Hongliang and Yao, Wenlin and Ma, Kaixin and Yu, Wenhao and Dai, Yong and Zhang, Hongming and Lan, Zhenzhong and Yu, Dong},
109
107
journal={arXiv preprint arXiv:2401.13919},
110
108
year={2024}
111
109
}
112
-
113
110
```
114
111
115
112
```
116
-
117
113
@misc{abuelsaad2024-agente,
118
114
title={Agent-E: From Autonomous Web Navigation to Foundational Design Principles in Agentic Systems},
119
115
author={Tamer Abuelsaad and Deepak Akkil and Prasenjit Dey and Ashish Jagmohan and Aditya Vempaty and Ravi Kokku},
@@ -123,11 +119,4 @@ archivePrefix={arXiv},
123
119
primaryClass={cs.AI},
124
120
url={https://arxiv.org/abs/2407.13032},
125
121
}
126
-
127
- ```
128
-
129
- ```
130
-
131
- ```
132
-
133
122
```
0 commit comments