<?xml version="1.0" encoding="utf-8"?>
<?xml-stylesheet type="text/css" href="http://www.recognition.su/wiki/skins/common/feed.css?116"?>
<rss version="2.0" xmlns:dc="http://purl.org/dc/elements/1.1/">
	<channel>
		<!--
			Channel-level metadata for this feed: display title, channel link
			(index.php with a percent-encoded title parameter ending in
			":Recentchangeslinked"), short description, content language,
			the software that generated the feed, and the time the feed was built
			(given in GMT).
		-->
		<title>MachineLearning - Связанные правки для Direct Preference Optimization [ru]</title>
		<link>http://www.recognition.su/wiki/index.php?title=%D0%A1%D0%BB%D1%83%D0%B6%D0%B5%D0%B1%D0%BD%D0%B0%D1%8F:Recentchangeslinked</link>
		<description>Связанные правки</description>
		<language>ru</language>
		<generator>MediaWiki 1.12.0</generator>
		<lastBuildDate>Tue, 16 Jun 2026 20:09:38 GMT</lastBuildDate>
		<item>
			<!-- Change entry for the page "Chain-of-thoughts"; the link carries diff=107356 with oldid=prev. -->
			<title>Chain-of-thoughts</title>
			<link>http://www.recognition.su/wiki/index.php?title=Chain-of-thoughts&amp;diff=107356&amp;oldid=prev</link>
			<!-- Entity-escaped HTML summary. The line break before the closing tag is part of the text and is kept unchanged. -->
			<description>&lt;p&gt;Новая: {{well|Статья написана с использованием LLM '''OpenAI GPT-5.4''' и проверена участником ~~~~}}  '''Chain-of-thoughts''' (часто со...&lt;/p&gt;
</description>
			<pubDate>Tue, 16 Jun 2026 12:24:30 GMT</pubDate>
			<dc:creator>Ilia Prokofev</dc:creator>
			<!-- URL of the page's discussion ("Обсуждение:") page. -->
			<comments>http://www.recognition.su/wiki/index.php?title=%D0%9E%D0%B1%D1%81%D1%83%D0%B6%D0%B4%D0%B5%D0%BD%D0%B8%D0%B5:Chain-of-thoughts</comments>
		</item>
		<item>
			<!-- Change entry for the page "Большая языковая модель"; the link carries diff=107331 with oldid=prev. -->
			<title>Большая языковая модель</title>
			<link>http://www.recognition.su/wiki/index.php?title=%D0%91%D0%BE%D0%BB%D1%8C%D1%88%D0%B0%D1%8F_%D1%8F%D0%B7%D1%8B%D0%BA%D0%BE%D0%B2%D0%B0%D1%8F_%D0%BC%D0%BE%D0%B4%D0%B5%D0%BB%D1%8C&amp;diff=107331&amp;oldid=prev</link>
			<!-- Entity-escaped HTML summary. The line break before the closing tag is part of the text and is kept unchanged. -->
			<description>&lt;p&gt;Исправлены формулы LaTeX&lt;/p&gt;
</description>
			<pubDate>Tue, 16 Jun 2026 10:58:16 GMT</pubDate>
			<dc:creator>Emil Petrov</dc:creator>
			<!-- URL of the page's discussion ("Обсуждение:") page. -->
			<comments>http://www.recognition.su/wiki/index.php?title=%D0%9E%D0%B1%D1%81%D1%83%D0%B6%D0%B4%D0%B5%D0%BD%D0%B8%D0%B5:%D0%91%D0%BE%D0%BB%D1%8C%D1%88%D0%B0%D1%8F_%D1%8F%D0%B7%D1%8B%D0%BA%D0%BE%D0%B2%D0%B0%D1%8F_%D0%BC%D0%BE%D0%B4%D0%B5%D0%BB%D1%8C</comments>
		</item>
		<item>
			<!-- Change entry for the page "Group Relative Policy Optimization"; the link carries diff=107320 with oldid=prev. -->
			<title>Group Relative Policy Optimization</title>
			<link>http://www.recognition.su/wiki/index.php?title=Group_Relative_Policy_Optimization&amp;diff=107320&amp;oldid=prev</link>
			<!-- The summary is an empty escaped paragraph. The line break before the closing tag is part of the text and is kept unchanged. -->
			<description>&lt;p&gt;&lt;/p&gt;
</description>
			<pubDate>Tue, 16 Jun 2026 09:41:03 GMT</pubDate>
			<dc:creator>Ilia Prokofev</dc:creator>
			<!-- URL of the page's discussion ("Обсуждение:") page. -->
			<comments>http://www.recognition.su/wiki/index.php?title=%D0%9E%D0%B1%D1%81%D1%83%D0%B6%D0%B4%D0%B5%D0%BD%D0%B8%D0%B5:Group_Relative_Policy_Optimization</comments>
		</item>
	</channel>
</rss>