Add new talk

This commit is contained in:
rfl 2025-06-15 18:34:11 +02:00
parent b7eaf80617
commit 8272a1639e
Signed by: rfl
GPG key ID: 48B0E5DDF8FA62EF
4 changed files with 327 additions and 0 deletions

View file

@ -0,0 +1,64 @@
@misc{metr2025,
author = {METR},
title = {Measuring AI Ability to Complete Long Tasks},
year = {2025},
url = {https://metr.org/blog/2025-03-19-measuring-ai-ability-to-complete-long-tasks/}
}
@article{acl2024,
author = {Author(s) of ACL Paper}, % Replace with actual author(s)
title = {PowerPoint Task Completion: Evaluating LLMs on Multi-Turn, Multi-Modal Instructions},
year = {2024},
journal = {Findings of the Association for Computational Linguistics},
note = {ACL 2024},
url = {https://aclanthology.org/2024.findings-acl.514.pdf}
}
@misc{gorilla,
author = {Gorilla Team},
title = {Gorilla APIBench Leaderboard},
year = {2025},
url = {https://gorilla.cs.berkeley.edu/leaderboard.html}
}
@misc{aider,
author = {Aider Team},
title = {Aider.chat Leaderboards},
year = {2025},
url = {https://aider.chat/docs/leaderboards/}
}
@misc{metaculus,
author = {Metaculus},
title = {Metaculus: AI Prediction Markets},
year = {2025},
url = {https://www.metaculus.com/questions/?topic=ai}
}
@misc{predictit,
author = {PredictIt},
title = {PredictIt Markets},
year = {2025},
url = {https://www.predictit.org/}
}
@misc{polymarket,
author = {Polymarket},
title = {Polymarket: AI Markets},
year = {2025},
url = {https://polymarket.com/markets/all/ai}
}
@techreport{aisafety,
author = {International AI Safety Report Team},
title = {International AI Safety Report},
year = {2025},
institution = {International AI Safety Report},
url = {https://arxiv.org/abs/2501.17805}
}
@misc{trackingai,
author = {TrackingAI Team},
title = {TrackingAI.org},
year = {2025},
url = {https://trackingai.org/home}
}