[ { "Accuracy (Dev)": 74.9, "Accuracy (Test-P)": 74.5, "Accuracy (Test-U)": 76.2, "code_links": [ { "title": "airsplay/lxmert", "url": "https://github.com/airsplay/lxmert" } ], "date": "2019-08-20", "date2": 20190820, "model": "LXMERT", "paper": { "title": "LXMERT: Learning Cross-Modality Encoder Representations from Transformers", "url": "https://cknow.io/lib/94cc9b3f81429e25" }, "paper_data_uoa": "94cc9b3f81429e25" }, { "Accuracy (Dev)": 67.4, "Accuracy (Test-P)": 67, "Accuracy (Test-U)": 67.3, "code_links": [ { "title": "uclanlp/visualbert", "url": "https://github.com/uclanlp/visualbert" } ], "date": "2019-08-09", "date2": 20190809, "model": "VisualBERT", "paper": { "title": "VisualBERT: A Simple and Performant Baseline for Vision and Language", "url": "https://cknow.io/lib/faaef4b6d973abbf" }, "paper_data_uoa": "faaef4b6d973abbf" } ]