<?xml version="1.0" encoding="UTF-8"?>
<!--
	Atom 1.0 feed of the edit history for the wiki page
	"Reinforcement Learning from Human Feedback" on w.ryanyang.kr.
	The encoding is declared explicitly because the feed carries
	non-ASCII (Korean) text; UTF-8 is also what a parser assumes when no
	encoding is declared, so the parsed content is unchanged.
-->
<feed xmlns="http://www.w3.org/2005/Atom" xml:lang="ko">
	<!-- Feed-level metadata: the id and the rel="self" link are the same history-feed URL; rel="alternate" is the HTML history page. -->
	<id>https://w.ryanyang.kr/index.php?action=history&amp;feed=atom&amp;title=Reinforcement_Learning_from_Human_Feedback</id>
	<title>Reinforcement Learning from Human Feedback - 편집 역사</title>
	<link rel="self" type="application/atom+xml" href="https://w.ryanyang.kr/index.php?action=history&amp;feed=atom&amp;title=Reinforcement_Learning_from_Human_Feedback"/>
	<link rel="alternate" type="text/html" href="https://w.ryanyang.kr/index.php?title=Reinforcement_Learning_from_Human_Feedback&amp;action=history"/>
	<updated>2026-04-18T12:40:02Z</updated>
	<subtitle>이 문서의 편집 역사</subtitle>
	<generator>MediaWiki 1.37.1</generator>
	<!-- The only entry in this feed: diff 3944 against the previous revision, labelled as a new page, authored by Ryanyang. -->
	<entry>
		<id>https://w.ryanyang.kr/index.php?title=Reinforcement_Learning_from_Human_Feedback&amp;diff=3944&amp;oldid=prev</id>
		<title>Ryanyang: 새 문서: A short introduction to RLHF and post-training focused on language models by Nathan Lambert   https://rlhfbook.com/ 분류:2026 분류:AI 분류:Book 분류:인공지능 분류:RLHF 분류:강화학습 분류:Reinforcement Learning</title>
		<link rel="alternate" type="text/html" href="https://w.ryanyang.kr/index.php?title=Reinforcement_Learning_from_Human_Feedback&amp;diff=3944&amp;oldid=prev"/>
		<updated>2026-03-03T10:33:39Z</updated>

		<!--
			The summary is HTML escaped once for XML (type="html").
			The "&amp;amp;" sequences are therefore correct: they decode to
			"&amp;" inside the HTML href attributes. Do not re-indent or
			pretty-print this element; its whitespace and line breaks are
			part of the payload.
		-->
		<summary type="html">&lt;p&gt;새 문서: A short introduction to RLHF and post-training focused on language models by Nathan Lambert   https://rlhfbook.com/ &lt;a href=&quot;/index.php?title=%EB%B6%84%EB%A5%98:2026&amp;amp;action=edit&amp;amp;redlink=1&quot; class=&quot;new&quot; title=&quot;분류:2026 (없는 문서)&quot;&gt;분류:2026&lt;/a&gt; &lt;a href=&quot;/index.php?title=%EB%B6%84%EB%A5%98:AI&amp;amp;action=edit&amp;amp;redlink=1&quot; class=&quot;new&quot; title=&quot;분류:AI (없는 문서)&quot;&gt;분류:AI&lt;/a&gt; &lt;a href=&quot;/index.php?title=%EB%B6%84%EB%A5%98:Book&amp;amp;action=edit&amp;amp;redlink=1&quot; class=&quot;new&quot; title=&quot;분류:Book (없는 문서)&quot;&gt;분류:Book&lt;/a&gt; &lt;a href=&quot;/index.php?title=%EB%B6%84%EB%A5%98:%EC%9D%B8%EA%B3%B5%EC%A7%80%EB%8A%A5&amp;amp;action=edit&amp;amp;redlink=1&quot; class=&quot;new&quot; title=&quot;분류:인공지능 (없는 문서)&quot;&gt;분류:인공지능&lt;/a&gt; &lt;a href=&quot;/index.php?title=%EB%B6%84%EB%A5%98:RLHF&amp;amp;action=edit&amp;amp;redlink=1&quot; class=&quot;new&quot; title=&quot;분류:RLHF (없는 문서)&quot;&gt;분류:RLHF&lt;/a&gt; &lt;a href=&quot;/index.php?title=%EB%B6%84%EB%A5%98:%EA%B0%95%ED%99%94%ED%95%99%EC%8A%B5&amp;amp;action=edit&amp;amp;redlink=1&quot; class=&quot;new&quot; title=&quot;분류:강화학습 (없는 문서)&quot;&gt;분류:강화학습&lt;/a&gt; &lt;a href=&quot;/index.php?title=%EB%B6%84%EB%A5%98:Reinforcement_Learning&amp;amp;action=edit&amp;amp;redlink=1&quot; class=&quot;new&quot; title=&quot;분류:Reinforcement Learning (없는 문서)&quot;&gt;분류:Reinforcement Learning&lt;/a&gt;&lt;/p&gt;
&lt;p&gt;&lt;b&gt;새 문서&lt;/b&gt;&lt;/p&gt;&lt;div&gt;A short introduction to RLHF and post-training focused on language models by Nathan Lambert&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
https://rlhfbook.com/&lt;br /&gt;
[[분류:2026]]&lt;br /&gt;
[[분류:AI]]&lt;br /&gt;
[[분류:Book]]&lt;br /&gt;
[[분류:인공지능]]&lt;br /&gt;
[[분류:RLHF]]&lt;br /&gt;
[[분류:강화학습]]&lt;br /&gt;
[[분류:Reinforcement Learning]]&lt;/div&gt;</summary>
		<author><name>Ryanyang</name></author>
	</entry>
</feed>