<?xml version="1.0" encoding="UTF-8"?>
<!-- generator="FeedCreator 1.8" -->
<?xml-stylesheet href="https://jlab.soe.ucsc.edu/nlp-wiki/lib/exe/css.php?s=feed" type="text/css"?>
<rdf:RDF
    xmlns="http://purl.org/rss/1.0/"
    xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
    xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
    xmlns:dc="http://purl.org/dc/elements/1.1/">
    <channel rdf:about="https://jlab.soe.ucsc.edu/nlp-wiki/feed.php">
        <title>NLP Wiki paper</title>
        <description></description>
        <link>https://jlab.soe.ucsc.edu/nlp-wiki/</link>
        <image rdf:resource="https://jlab.soe.ucsc.edu/nlp-wiki/lib/tpl/dokuwiki/images/favicon.ico" />
       <dc:date>2026-05-11T09:20:35+00:00</dc:date>
        <items>
            <rdf:Seq>
                <rdf:li rdf:resource="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:a_tutorial_on_deep_latent_variable_models_of_natural_language&amp;rev=1686814574&amp;do=diff"/>
                <rdf:li rdf:resource="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:discriminative_training_methods_for_hidden_markov_models_-_theory_and_experiments_with_perceptron_algorithms&amp;rev=1686814574&amp;do=diff"/>
                <rdf:li rdf:resource="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:dual_learning_for_machine_translation&amp;rev=1686814574&amp;do=diff"/>
                <rdf:li rdf:resource="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:etc&amp;rev=1686814574&amp;do=diff"/>
                <rdf:li rdf:resource="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:experience_grounds_language&amp;rev=1686814574&amp;do=diff"/>
                <rdf:li rdf:resource="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:language_models_are_few-shot_learners&amp;rev=1686814574&amp;do=diff"/>
                <rdf:li rdf:resource="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:language_models_are_unsupervised_multitask_learners&amp;rev=1686814574&amp;do=diff"/>
                <rdf:li rdf:resource="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:megatron-lm_training_multi-billion_parameter_language_models_using_model_parallelism&amp;rev=1686814574&amp;do=diff"/>
                <rdf:li rdf:resource="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:mikolov_2013_-_distributed_representations_of_words_and_phrases_and_their_compositionality&amp;rev=1686814574&amp;do=diff"/>
                <rdf:li rdf:resource="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:mikolov_2013_-_efficient_estimation_of_word_representations_in_vector_space&amp;rev=1686814574&amp;do=diff"/>
                <rdf:li rdf:resource="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:schwartz_2018_-_sopa_bridging_cnns_rnns_and_weighted_finite-state_machines&amp;rev=1686814574&amp;do=diff"/>
                <rdf:li rdf:resource="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:the_sample_complexity_of_agnostic_learning_under_deterministic_labels&amp;rev=1686814574&amp;do=diff"/>
            </rdf:Seq>
        </items>
    </channel>
    <image rdf:about="https://jlab.soe.ucsc.edu/nlp-wiki/lib/tpl/dokuwiki/images/favicon.ico">
        <title>NLP Wiki</title>
        <link>https://jlab.soe.ucsc.edu/nlp-wiki/</link>
        <url>https://jlab.soe.ucsc.edu/nlp-wiki/lib/tpl/dokuwiki/images/favicon.ico</url>
    </image>
    <item rdf:about="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:a_tutorial_on_deep_latent_variable_models_of_natural_language&amp;rev=1686814574&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2023-06-15T07:36:14+00:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>paper:a_tutorial_on_deep_latent_variable_models_of_natural_language</title>
        <link>https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:a_tutorial_on_deep_latent_variable_models_of_natural_language&amp;rev=1686814574&amp;do=diff</link>
        <description>A Tutorial on Deep Latent Variable Models of Natural Language

Kim et al 2019 - A Tutorial on Deep Latent Variable Models of Natural Language</description>
    </item>
    <item rdf:about="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:discriminative_training_methods_for_hidden_markov_models_-_theory_and_experiments_with_perceptron_algorithms&amp;rev=1686814574&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2023-06-15T07:36:14+00:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>paper:discriminative_training_methods_for_hidden_markov_models_-_theory_and_experiments_with_perceptron_algorithms</title>
        <link>https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:discriminative_training_methods_for_hidden_markov_models_-_theory_and_experiments_with_perceptron_algorithms&amp;rev=1686814574&amp;do=diff</link>
        <description>Discriminative Training Methods for Hidden Markov Models - Theory and Experiments with Perceptron Algorithms

Discriminative Training Methods for Hidden Markov Models - Theory and Experiments with Perceptron Algorithms</description>
    </item>
    <item rdf:about="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:dual_learning_for_machine_translation&amp;rev=1686814574&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2023-06-15T07:36:14+00:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>paper:dual_learning_for_machine_translation</title>
        <link>https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:dual_learning_for_machine_translation&amp;rev=1686814574&amp;do=diff</link>
        <description>Dual Learning For Machine Translation

Dual Learning For Machine Translation

TLDR; The authors cast machine translation as a game of a primal task and a dual task, which allows two agents to teach each other in a reinforcement learning fashion (i.e., policy gradient method). With this implementation, the agent only requires monolingual English</description>
    </item>
    <item rdf:about="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:etc&amp;rev=1686814574&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2023-06-15T07:36:14+00:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>paper:etc</title>
        <link>https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:etc&amp;rev=1686814574&amp;do=diff</link>
        <description>ETC: Encoding Long and Structured Inputs in Transformers

ETC: Encoding Long and Structured Inputs in Transformers

TLDR; ETC encodes long inputs using global-local attention and represents structures by combining relative position representations and flexible masking. It also employs CPC pre-training for hierarchical global tokens (structures).</description>
    </item>
    <item rdf:about="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:experience_grounds_language&amp;rev=1686814574&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2023-06-15T07:36:14+00:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>paper:experience_grounds_language</title>
        <link>https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:experience_grounds_language&amp;rev=1686814574&amp;do=diff</link>
        <description>Experience Grounds Language

Experience Grounds Language

TLDR; Current models trained only from text corpora might hinder the language understanding research because the supervision from text alone can be limited, so we need to embed social context. The authors proposed the notion of World Scopes (WS), which considers not only the text corpus but also grounding, embodiment, and social interaction.</description>
    </item>
    <item rdf:about="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:language_models_are_few-shot_learners&amp;rev=1686814574&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2023-06-15T07:36:14+00:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>paper:language_models_are_few-shot_learners</title>
        <link>https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:language_models_are_few-shot_learners&amp;rev=1686814574&amp;do=diff</link>
        <description>Language Models are Few-Shot Learners

Language Models are Few-Shot Learners</description>
    </item>
    <item rdf:about="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:language_models_are_unsupervised_multitask_learners&amp;rev=1686814574&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2023-06-15T07:36:14+00:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>paper:language_models_are_unsupervised_multitask_learners</title>
        <link>https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:language_models_are_unsupervised_multitask_learners&amp;rev=1686814574&amp;do=diff</link>
        <description>Language Models are Unsupervised Multitask Learners

Language Models are Unsupervised Multitask Learners

	*  Code: &lt;https://github.com/openai/gpt-2&gt;
	*  Open-source clone of the dataset: OpenWebText (from &lt;https://github.com/NVIDIA/Megatron-LM&gt;)</description>
    </item>
    <item rdf:about="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:megatron-lm_training_multi-billion_parameter_language_models_using_model_parallelism&amp;rev=1686814574&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2023-06-15T07:36:14+00:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>paper:megatron-lm_training_multi-billion_parameter_language_models_using_model_parallelism</title>
        <link>https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:megatron-lm_training_multi-billion_parameter_language_models_using_model_parallelism&amp;rev=1686814574&amp;do=diff</link>
        <description>Megatron-LM: Training Multi-Billion Parameter Language Models Using Model Parallelism

Megatron-LM: Training Multi-Billion Parameter Language Models Using
Model Parallelism

	*  Follow-up blog post: State-of-the-Art Language Modeling Using Megatron on the NVIDIA A100 GPU</description>
    </item>
    <item rdf:about="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:mikolov_2013_-_distributed_representations_of_words_and_phrases_and_their_compositionality&amp;rev=1686814574&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2023-06-15T07:36:14+00:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>paper:mikolov_2013_-_distributed_representations_of_words_and_phrases_and_their_compositionality</title>
        <link>https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:mikolov_2013_-_distributed_representations_of_words_and_phrases_and_their_compositionality&amp;rev=1686814574&amp;do=diff</link>
        <description>Distributed Representations of Words and Phrases and their Compositionality

Distributed Representations of Words and Phrases and their Compositionality</description>
    </item>
    <item rdf:about="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:mikolov_2013_-_efficient_estimation_of_word_representations_in_vector_space&amp;rev=1686814574&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2023-06-15T07:36:14+00:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>paper:mikolov_2013_-_efficient_estimation_of_word_representations_in_vector_space</title>
        <link>https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:mikolov_2013_-_efficient_estimation_of_word_representations_in_vector_space&amp;rev=1686814574&amp;do=diff</link>
        <description>Efficient Estimation of Word Representations in Vector Space

Efficient Estimation of Word Representations in Vector Space

Follow-up work: Mikolov 2013 - Distributed Representations of Words and Phrases and their Compositionality</description>
    </item>
    <item rdf:about="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:schwartz_2018_-_sopa_bridging_cnns_rnns_and_weighted_finite-state_machines&amp;rev=1686814574&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2023-06-15T07:36:14+00:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>paper:schwartz_2018_-_sopa_bridging_cnns_rnns_and_weighted_finite-state_machines</title>
        <link>https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:schwartz_2018_-_sopa_bridging_cnns_rnns_and_weighted_finite-state_machines&amp;rev=1686814574&amp;do=diff</link>
        <description>SoPa: Bridging CNNs, RNNs, and Weighted Finite-State Machines

SoPa: Bridging CNNs, RNNs, and Weighted Finite-State Machines</description>
    </item>
    <item rdf:about="https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:the_sample_complexity_of_agnostic_learning_under_deterministic_labels&amp;rev=1686814574&amp;do=diff">
        <dc:format>text/html</dc:format>
        <dc:date>2023-06-15T07:36:14+00:00</dc:date>
        <dc:creator>Anonymous (anonymous@undisclosed.example.com)</dc:creator>
        <title>paper:the_sample_complexity_of_agnostic_learning_under_deterministic_labels</title>
        <link>https://jlab.soe.ucsc.edu/nlp-wiki/doku.php?id=paper:the_sample_complexity_of_agnostic_learning_under_deterministic_labels&amp;rev=1686814574&amp;do=diff</link>
        <description>Paper: The sample complexity of agnostic learning under deterministic labels

The sample complexity of agnostic learning under deterministic labels</description>
    </item>
</rdf:RDF>
