<?xml version="1.0" encoding="UTF-8"?>
<!--
    RSS 2.0 feed listing Viblo posts tagged "direct-preference-optimization".
    All date fields (lastBuildDate, pubDate) use the RFC 822 date-time format
    required by the RSS 2.0 specification, not ISO 8601.
-->
<rss
    version="2.0"
    xmlns:atom="http://www.w3.org/2005/Atom"
    xmlns:content="http://purl.org/rss/1.0/modules/content/"
    xmlns:dc="http://purl.org/dc/elements/1.1/"
    xmlns:webfeeds="http://webfeeds.org/rss/1.0"
    xmlns:media="http://search.yahoo.com/mrss/">
    <channel>
        <title>Direct-preference-optimization Tag - Viblo</title>
        <!-- NOTE(review): RSS 2.0 expects the channel link to be the HTML page for this
             channel; this points at the generic /rss path. Confirm the intended tag page URL. -->
        <link>https://viblo.asia/rss</link>
        <description><![CDATA[Free service for technical knowledge sharing]]></description>
        <!-- Self-reference of this feed document; "type" identifies it as RSS. -->
        <atom:link href="https://viblo.asia/rss/tags/direct-preference-optimization.rss" rel="self" type="application/rss+xml"/>
        <copyright>Sun* Inc.</copyright>
        <webfeeds:logo>https://viblo.asia/logo_full.svg</webfeeds:logo>
        <!-- NOTE(review): RSS 2.0 defines the image url as a GIF, JPEG or PNG; an SVG may
             not render in every reader. Confirm whether a raster logo is available. -->
        <image>
            <url>https://viblo.asia/logo_full.svg</url>
            <title>Direct-preference-optimization Tag - Viblo</title>
            <link>https://viblo.asia/rss</link>
        </image>
        <language>vi-vn</language>
        <!-- Same instant as the former ISO 8601 value 2026-06-13T20:39:27+07:00. -->
        <lastBuildDate>Sat, 13 Jun 2026 20:39:27 +0700</lastBuildDate>
        <item>
            <!-- Plain escaped text: parses to "RLHF & DPO ...". Inside CDATA the sequence
                 "&amp;" is not decoded and would reach readers as a literal "&amp;". -->
            <title>RLHF &amp; DPO: Kỹ thuật mới đơn giản hơn, tăng cường khả năng Fine-tuning cho Large language models</title>
            <link>https://viblo.asia/p/rlhf-dpo-ky-thuat-moi-don-gian-hon-tang-cuong-kha-nang-fine-tuning-cho-large-language-models-zXRJ8bnZVGq</link>
            <guid isPermaLink="true">https://viblo.asia/p/rlhf-dpo-ky-thuat-moi-don-gian-hon-tang-cuong-kha-nang-fine-tuning-cho-large-language-models-zXRJ8bnZVGq</guid>
            <description><![CDATA[RLHF là gì?

Reinforcement Learning from Human Feedback (RLHF) là một phương pháp mới, tiên tiến trong lĩnh vực Trí tuệ nhân tạo (AI) được nổi lên với...]]></description>
            <dc:creator>Phuc Phan</dc:creator>
            <!-- NOTE(review): the source value "2023-12-13 18:51:24" carried no time zone;
                 +0700 is assumed to match lastBuildDate. Confirm against the publishing system. -->
            <pubDate>Wed, 13 Dec 2023 18:51:24 +0700</pubDate>
        </item>
    </channel>
</rss>
