<?xml version="1.0" encoding="UTF-8"?><rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	>

<channel>
	<!-- Channel-level metadata for the "Chat Agent" tag feed of Blog Sketch. -->
	<title>Chat Agent &#8211; Blog Sketch</title>
	<!-- rel="self": the address of this feed document itself. -->
	<atom:link href="https://blog.ziaowang.top/tag/chat-agent/feed/" rel="self" type="application/rss+xml" />
	<!-- Site the feed belongs to. -->
	<link>https://blog.ziaowang.top</link>
	<!-- NOTE(review): the channel description is empty. RSS 2.0 lists description
	     as a required channel element, so consider supplying the site tagline in
	     the generator settings. -->
	<description></description>
	<lastBuildDate>Sun, 08 Sep 2024 20:27:46 +0000</lastBuildDate>
	<language>en-US</language>
	<!-- Syndication-module refresh hints: period "hourly", frequency 1.
	     The values are written without surrounding whitespace so that consumers
	     which compare or parse the text without trimming still read exactly
	     "hourly" and "1". -->
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
	<generator>https://wordpress.org/?v=6.8.5</generator>
	<!-- Feed entry for the post "LLM + RLHF = Chat Agent". -->
	<item>
		<title>LLM + RLHF = Chat Agent</title>
		<link>https://blog.ziaowang.top/2024/06/16/llm-rlhf-chat-agent/</link>
		<comments>https://blog.ziaowang.top/2024/06/16/llm-rlhf-chat-agent/#respond</comments>
		<dc:creator><![CDATA[wponaws]]></dc:creator>
		<pubDate>Sun, 16 Jun 2024 03:28:16 +0000</pubDate>
		<!-- Categories and tags attached to the post. -->
		<category><![CDATA[Uncategorized]]></category>
		<category><![CDATA[Chat Agent]]></category>
		<category><![CDATA[OpenAI]]></category>
		<category><![CDATA[RLHF]]></category>
		<!-- isPermaLink="false": the value is an opaque identifier, not a link to open. -->
		<guid isPermaLink="false">http://localhost/mysite/?p=1344</guid>
		<!-- HTML excerpt. Everything inside the CDATA section is payload; whitespace
		     and character references there are kept exactly as generated. -->
		<description><![CDATA[<p>Large-Scale Language Model + Reinforcement learning from human feedback = Helpful Chat Agent</p>



<h3 class="wp-block-heading">回顾 OpenAI GPT 的规模升级之路</h3>



<p>在对话智能体应用大火的今天，回顾第一个杀手级应用 ChatGPT 被研发出来之前经历的事情格外有趣。从其创造者&#8230;</p>]]></description>
		<!-- HTML body as delivered by the feed (same text as the excerpt, ending in an ellipsis). -->
		<content:encoded><![CDATA[<p>Large-Scale Language Model + Reinforcement learning from human feedback = Helpful Chat Agent</p>



<h3 class="wp-block-heading">回顾 OpenAI GPT 的规模升级之路</h3>



<p>在对话智能体应用大火的今天，回顾第一个杀手级应用 ChatGPT 被研发出来之前经历的事情格外有趣。从其创造者&hellip;</p>]]></content:encoded>
		<!-- Comment feed for this post and its current comment count. -->
		<wfw:commentRss>https://blog.ziaowang.top/2024/06/16/llm-rlhf-chat-agent/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	</item>
	</channel>
</rss>
