{
    "author": null,
    "date_published": null,
    "dek": null,
    "direction": "ltr",
    "domain": "kylrth.com",
    "excerpt": "Posted on 2022-02-09 at 20:47:59 UTC-0500deep-learning neural-scalingThis paper is all about trying a bunch of different changes to the training setup to see what affects the power law exponent over&hellip;",
    "lead_image_url": null,
    "next_page_url": null,
    "rendered_pages": 1,
    "title": "Data scaling laws in NMT: the effect of noise and architecture",
    "total_pages": 1,
    "url": "https://kylrth.com/paper/data-scaling-laws-nmt/",
    "word_count": 7
}