26:["$","$L2f",null,{"data":{"isPreview":true,"seq":1612805,"episode":{"Id":"708b6426d31e51d54cb553802a900e9c762ac9ac48071a3dac42ff08989388c6","Seq":1612805,"PodId":"2d4f05aac4d528e40e954452346d5021f1ab57bc06cca986eb689df8c034ea98","PodSeq":9417,"Title":"Meta-Rewarding Language Models: Self-Improving Alignment with LLM-as-a-Meta-Judge","PodName":"Arxiv Papers","Description":"

The paper introduces a Meta-Rewarding mechanism for LLMs, enhancing their self-judgment capabilities, leading to significant performance improvements without relying on human data.

https://arxiv.org/abs//2407.19594

YouTube: https://www.youtube.com/@ArxivPapers

TikTok: https://www.tiktok.com/@arxiv_papers

Apple Podcasts: https://podcasts.apple.com/us/podcast/arxiv-papers/id1692476016

Spotify: https://podcasters.spotify.com/pod/show/arxiv-papers

\n\n--- \n\nSupport this podcast: https://podcasters.spotify.com/pod/show/arxiv-papers/support","Url":"https://podcasters.spotify.com/pod/show/arxiv-papers/episodes/Meta-Rewarding-Language-Models-Self-Improving-Alignment-with-LLM-as-a-Meta-Judge-e2mpqut","Link":"https://anchor.fm/s/e3d903bc/podcast/play/90024349/https%3A%2F%2Fd3ctxlq1ktw2nl.cloudfront.net%2Fstaging%2F2024-7-4%2F599c8f09-a79b-8b0b-2f3a-535da4de5385.mp3","LinkType":"mp3","PublishTime":"$D2024-08-04T02:15:08.000Z","Img":"https://d3t3ozftmdmh3i.cloudfront.net/staging/podcast_uploaded_nologo/38126503/38126503-1686696647986-c72655f5033ff.jpg","EpImg":"https://d3t3ozftmdmh3i.cloudfront.net/staging/podcast_uploaded_nologo/38126503/38126503-1686696647986-c72655f5033ff.jpg","Duration":"00:22:41","Language":null,"SampleDuration":null,"IsVBR":false,"Transcribed":false,"Indexed":1,"Deleted":false,"RedirectSeq":null,"Source":null,"Size":null},"prevAndNext":{"prevSeq":1612804,"nextSeq":1612766},"states":{"state":"not-login","extra":{"summary":"Arxiv Papers - Meta-Rewarding Language Models: Self-Improving Alignment with LLM-as-a-Meta-Judge","previewContent":{"summary":"Arxiv Papers - Meta-Rewarding Language Models: Self-Improving Alignment with LLM-as-a-Meta-Judge","chapters":[],"keywords":[],"highlights":[],"transcripts":[]}}}}}]