{
    "author": null,
    "date_published": "2022-02-04T00:00:00.000Z",
    "dek": null,
    "direction": "ltr",
    "domain": "arxiv.org",
    "excerpt": "In this work, we study the effect of varying the architecture and training data quality on the data scaling properties of Neural Machine Translation (NMT). First, we establish that the test loss of&hellip;",
    "lead_image_url": "https://static.arxiv.org/icons/twitter/arxiv-logo-twitter-square.png",
    "next_page_url": null,
    "rendered_pages": 1,
    "title": "Data Scaling Laws in NMT: The Effect of Noise and Architecture",
    "total_pages": 1,
    "url": "https://arxiv.org/abs/2202.01994v1",
    "word_count": 179
}