Spaces:
Running
Running
Kunal Pai
committed on
Commit
·
03de09a
1
Parent(s):
58408af
Add base models for Employee agents
Browse files- paper/conference_101719.tex +1 -0
- paper/references.bib +60 -0
paper/conference_101719.tex
CHANGED
@@ -119,6 +119,7 @@ The system uses a two-tiered hierarchy:
|
|
119 |
\item Task Execution: Receive task, execute, return result.
|
120 |
\item Resource Consumption: Associated costs (API, memory) tracked by system.
|
121 |
\end{itemize}
|
|
|
122 |
\end{itemize}
|
123 |
This hierarchy facilitates task decomposition and result aggregation; the dynamic pool provides flexibility.
|
124 |
|
|
|
119 |
\item Task Execution: Receive task, execute, return result.
|
120 |
\item Resource Consumption: Associated costs (API, memory) tracked by system.
|
121 |
\end{itemize}
|
122 |
+
Specialized employee agents are constructed using base models such as Mistral~7B~\cite{jiang2023mistral}, Llama~3~\cite{llama3herd}, Gemini~1.5~\cite{gemini1.5_report}, Qwen2.5~\cite{qwen2.5_report}, Qwen3~\cite{qwen3_blog}, and DeepSeek-R1~\cite{deepseekr1_report}, with the CEO agent configuring them via tailored system prompts.
|
123 |
\end{itemize}
|
124 |
This hierarchy facilitates task decomposition and result aggregation; the dynamic pool provides flexibility.
|
125 |
|
paper/references.bib
CHANGED
@@ -394,3 +394,63 @@
|
|
394 |
url={https://arxiv.org/abs/2407.03978},
|
395 |
}
|
396 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
394 |
url={https://arxiv.org/abs/2407.03978},
|
395 |
}
|
396 |
|
397 |
+
@article{jiang2023mistral,
|
398 |
+
title={{Mistral 7B}},
|
399 |
+
author={Jiang, Albert Q. and Sablayrolles, Alexandre and Mensch, Arthur and Bamford, Chris and Chaplot, Devendra Singh and de las Casas, Diego and Bressand, Florian and Lengyel, Gianna and Lample, Guillaume and Saulnier, Lucile and others},
|
400 |
+
year={2023},
|
401 |
+
eprint={2310.06825},
|
402 |
+
archivePrefix={arXiv},
|
403 |
+
primaryClass={cs.CL},
|
404 |
+
url={https://arxiv.org/abs/2310.06825},
|
405 |
+
}
|
406 |
+
|
407 |
+
@article{llama3herd,
|
408 |
+
title={{The Llama 3 Herd of Models}},
|
409 |
+
author={{Meta Llama Team}},
|
410 |
+
year={2024},
|
411 |
+
eprint={2407.21783},
|
412 |
+
archivePrefix={arXiv},
|
413 |
+
primaryClass={cs.CL},
|
414 |
+
url={https://arxiv.org/abs/2407.21783},
|
415 |
+
note={arXiv:2407.21783}
|
416 |
+
}
|
417 |
+
|
418 |
+
@article{gemini1.5_report,
|
419 |
+
title={{Gemini 1.5: Unlocking multimodal understanding across millions of tokens of context}},
|
420 |
+
author={{Gemini Team}},
|
421 |
+
year={2024},
|
422 |
+
eprint={2403.05530},
|
423 |
+
archivePrefix={arXiv},
|
424 |
+
primaryClass={cs.CL},
|
425 |
+
url={https://arxiv.org/abs/2403.05530},
|
426 |
+
note={arXiv:2403.05530}
|
427 |
+
}
|
428 |
+
|
429 |
+
@article{qwen2.5_report,
|
430 |
+
title={{Qwen2.5 Technical Report}},
|
431 |
+
author={{Qwen Team} and Yang, An and others},
|
432 |
+
year={2024},
|
433 |
+
eprint={2412.15115},
|
434 |
+
archivePrefix={arXiv},
|
435 |
+
primaryClass={cs.CL},
|
436 |
+
url={https://arxiv.org/abs/2412.15115},
|
437 |
+
note={arXiv:2412.15115}
|
438 |
+
}
|
439 |
+
|
440 |
+
@misc{qwen3_blog,
|
441 |
+
title={{Qwen3: Think Deeper, Act Faster}},
|
442 |
+
author={{Qwen Team}},
|
443 |
+
howpublished={\url{https://qwenlm.github.io/blog/qwen3/}},
|
444 |
+
year={2025}
|
445 |
+
}
|
446 |
+
|
447 |
+
@article{deepseekr1_report,
|
448 |
+
title={{DeepSeek-R1: Incentivizing Reasoning Capability in LLMs via Reinforcement Learning}},
|
449 |
+
author={{DeepSeek-AI} and others},
|
450 |
+
year={2025},
|
451 |
+
eprint={2501.12948},
|
452 |
+
archivePrefix={arXiv},
|
453 |
+
primaryClass={cs.CL},
|
454 |
+
url={https://arxiv.org/abs/2501.12948},
|
455 |
+
note={arXiv:2501.12948}
|
456 |
+
}
|