From 63db20f4f676df369a70aa3de44ba46bf333ddf3 Mon Sep 17 00:00:00 2001
From: acl-pwc-bot <94475230+acl-pwc-bot@users.noreply.github.com>
Date: Thu, 7 Mar 2024 02:05:14 +0100
Subject: [PATCH] Update metadata from Papers with Code
---
data/xml/2016.iwslt.xml | 1 +
data/xml/2018.iwslt.xml | 1 +
data/xml/2019.iwslt.xml | 2 +-
data/xml/2020.acl.xml | 9 +++++++++
data/xml/2020.bea.xml | 1 +
data/xml/2020.coling.xml | 1 +
data/xml/2020.emnlp.xml | 5 +++++
data/xml/2020.findings.xml | 3 +++
data/xml/2020.iwslt.xml | 2 +-
data/xml/2020.lrec.xml | 1 +
data/xml/2020.repl4nlp.xml | 1 +
data/xml/2021.acl.xml | 7 +++++++
data/xml/2021.eacl.xml | 1 +
data/xml/2021.emnlp.xml | 7 ++++++-
data/xml/2021.findings.xml | 4 ++++
data/xml/2021.iwslt.xml | 3 +--
data/xml/2021.naacl.xml | 1 +
data/xml/2021.ranlp.xml | 1 +
data/xml/2022.acl.xml | 4 ++++
data/xml/2022.coling.xml | 2 ++
data/xml/2022.findings.xml | 1 +
data/xml/2022.iwslt.xml | 4 +---
data/xml/2022.lrec.xml | 1 +
data/xml/2022.naacl.xml | 5 ++++-
data/xml/2022.rocling.xml | 2 +-
data/xml/C18.xml | 4 ++++
data/xml/D11.xml | 1 +
data/xml/D14.xml | 1 +
data/xml/D17.xml | 6 +++++-
data/xml/D18.xml | 10 ++++++++++
data/xml/D19.xml | 12 ++++++++++++
data/xml/E17.xml | 1 +
data/xml/K16.xml | 1 +
data/xml/K18.xml | 1 +
data/xml/K19.xml | 3 +++
data/xml/L16.xml | 2 +-
data/xml/N16.xml | 1 +
data/xml/N18.xml | 8 ++++++++
data/xml/N19.xml | 3 +++
data/xml/P16.xml | 4 ++++
data/xml/P17.xml | 5 +++++
data/xml/P18.xml | 12 ++++++++++++
data/xml/P19.xml | 11 +++++++++++
data/xml/Q16.xml | 1 +
data/xml/Q17.xml | 1 +
data/xml/S14.xml | 2 +-
data/xml/W12.xml | 1 -
data/xml/W14.xml | 2 +-
data/xml/W17.xml | 2 ++
data/xml/W18.xml | 2 +-
data/xml/W19.xml | 1 +
51 files changed, 152 insertions(+), 16 deletions(-)
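Notes: each hunk below adds or removes a Papers with Code annotation — a dataset name such as CoNLL or TED-LIUM, or a code repository such as mawic/annotator-bias-abusive-language — on a single <paper> record in the corresponding Anthology XML file. As a rough illustration of the kind of update being applied, here is a minimal sketch (not the bot's actual code), assuming the <paper>/<bibkey>/<pwcdataset> element names used in data/xml/, a hypothetical add_pwc_dataset helper, and an assumed dataset URL:

    import xml.etree.ElementTree as ET

    def add_pwc_dataset(xml_path, bibkey, dataset, url):
        """Attach a <pwcdataset> entry to the paper identified by bibkey."""
        tree = ET.parse(xml_path)
        for paper in tree.getroot().iter("paper"):
            if paper.findtext("bibkey") != bibkey:
                continue
            # Idempotence: skip if this dataset is already recorded.
            if any(el.text == dataset for el in paper.findall("pwcdataset")):
                return False
            el = ET.SubElement(paper, "pwcdataset", url=url)
            el.text = dataset
            tree.write(xml_path, encoding="UTF-8", xml_declaration=True)
            return True
        return False

    # For example, the first hunk below corresponds to:
    add_pwc_dataset(
        "data/xml/2016.iwslt.xml",
        "lazaridis-etal-2016-investigating",
        "TED-LIUM",
        "https://paperswithcode.com/dataset/ted-lium",  # assumed URL pattern
    )

The hunks also keep sibling entries in alphabetical order (e.g., CoNLL lands just before CoNLL 2003); the sketch above omits that ordering step.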
diff --git a/data/xml/2016.iwslt.xml b/data/xml/2016.iwslt.xml
index e9b7eb89e2..55ce6b8121 100644
--- a/data/xml/2016.iwslt.xml
+++ b/data/xml/2016.iwslt.xml
@@ -96,6 +96,7 @@
2016.iwslt-1.8
lazaridis-etal-2016-investigating
LibriSpeech
+ TED-LIUM
Towards Improving Low-Resource Speech Recognition Using Articulatory and Language Features
diff --git a/data/xml/2018.iwslt.xml b/data/xml/2018.iwslt.xml
index a33f3adc49..be2b5c991e 100644
--- a/data/xml/2018.iwslt.xml
+++ b/data/xml/2018.iwslt.xml
@@ -167,6 +167,7 @@
This paper describes the MeMAD project entry to the IWSLT Speech Translation Shared Task, addressing the translation of English audio into German text. Between the pipeline and end-to-end model tracks, we participated only in the former, with three contrastive systems. We tried also the latter, but were not able to finish our end-to-end model in time. All of our systems start by transcribing the audio into text through an automatic speech recognition (ASR) model trained on the TED-LIUM English Speech Recognition Corpus (TED-LIUM). Afterwards, we feed the transcripts into English-German text-based neural machine translation (NMT) models. Our systems employ three different translation models trained on separate training sets compiled from the English-German part of the TED Speech Translation Corpus (TED-TRANS) and the OPENSUBTITLES2018 section of the OPUS collection. In this paper, we also describe the experiments leading up to our final systems. Our experiments indicate that using OPENSUBTITLES2018 in training significantly improves translation performance. We also experimented with various pre- and postprocessing routines for the NMT module, but we did not have much success with these. Our best-scoring system attains a BLEU score of 16.45 on the test set for this year’s task.
2018.iwslt-1.13
sulubacak-etal-2018-memad
+ TED-LIUM
Prompsit’s Submission to the IWSLT 2018 Low Resource Machine Translation Task
diff --git a/data/xml/2019.iwslt.xml b/data/xml/2019.iwslt.xml
index 2e0f94d663..c3c8fa0e3b 100644
--- a/data/xml/2019.iwslt.xml
+++ b/data/xml/2019.iwslt.xml
@@ -74,6 +74,7 @@
inaguma-etal-2019-espnet
LibriSpeech
MuST-C
+ TED-LIUM
ON-TRAC Consortium End-to-End Speech Translation Systems for the IWSLT 2019 Shared Task
@@ -82,7 +83,6 @@
2019.iwslt-1.5
nguyen-2019-trac
MuST-C
- TED-LIUM 3
Transformer-based Cascaded Multimodal Speech Translation
diff --git a/data/xml/2020.acl.xml b/data/xml/2020.acl.xml
index 6b9bcea021..39a0430720 100644
--- a/data/xml/2020.acl.xml
+++ b/data/xml/2020.acl.xml
@@ -673,6 +673,7 @@
li-etal-2020-dice
ShannonAI/dice_loss_for_NLP
+ CoNLL
CoNLL 2003
MSRA CN NER
OntoNotes 4.0
@@ -2819,6 +2820,7 @@
jiang-etal-2020-generalizing
jzbjyb/SpanRel
+ CoNLL
CoNLL 2003
CoNLL-2012
OIE2016
@@ -4469,6 +4471,7 @@
zhang-etal-2020-efficient
yzhangcs/crfpar
+ CoNLL
CoNLL-2009
Penn Treebank
Universal Dependencies
@@ -5764,6 +5767,7 @@
kaneko-etal-2020-encoder
kanekomasahiro/bert-gec
+ CoNLL
CoNLL-2014 Shared Task: Grammatical Error Correction
JFLEG
WI-LOCNESS
@@ -7705,6 +7709,7 @@
ShannonAI/mrc-for-flat-nested-ner
ACE 2004
ACE 2005
+ CoNLL
CoNLL 2003
GENIA
MSRA CN NER
@@ -8575,6 +8580,7 @@
juntaoy/biaffine-ner
ACE 2004
ACE 2005
+ CoNLL
CoNLL 2002
CoNLL 2003
GENIA
@@ -8637,6 +8643,7 @@
wu-etal-2020-single
microsoft/vert-papers
+ CoNLL
CoNLL 2002
CoNLL 2003
@@ -9263,6 +9270,7 @@
wu-etal-2020-corefqa
ShannonAI/CorefQA
+ CoNLL
CoNLL-2012
@@ -11523,6 +11531,7 @@
10.18653/v1/2020.acl-main.777
chen-etal-2020-seqvat
+ CoNLL
CoNLL-2000
diff --git a/data/xml/2020.bea.xml b/data/xml/2020.bea.xml
index 4fcc362477..bee05c222a 100644
--- a/data/xml/2020.bea.xml
+++ b/data/xml/2020.bea.xml
@@ -222,6 +222,7 @@
10.18653/v1/2020.bea-1.16
omelianchuk-etal-2020-gector
grammarly/gector
+ CoNLL
CoNLL-2014 Shared Task: Grammatical Error Correction
FCE
WI-LOCNESS
diff --git a/data/xml/2020.coling.xml b/data/xml/2020.coling.xml
index 715eb2bf3b..bde3738e4e 100644
--- a/data/xml/2020.coling.xml
+++ b/data/xml/2020.coling.xml
@@ -1051,6 +1051,7 @@
10.18653/v1/2020.coling-main.78
luoma-pyysalo-2020-exploring
jouniluoma/bert-ner-cmv
+ CoNLL
CoNLL 2002
CoNLL 2003
diff --git a/data/xml/2020.emnlp.xml b/data/xml/2020.emnlp.xml
index b7a1791463..7bd13acca5 100644
--- a/data/xml/2020.emnlp.xml
+++ b/data/xml/2020.emnlp.xml
@@ -2042,6 +2042,7 @@
ACE 2004
ACE 2005
Adverse Drug Events (ADE) Corpus
+ CoNLL
CoNLL04
FewRel
Wiki-ZSL
@@ -7329,6 +7330,7 @@
wang-etal-2020-ain
Alibaba-NLP/AIN
ATIS
+ CoNLL
CoNLL 2003
@@ -7903,6 +7905,7 @@
yamada-etal-2020-luke
studio-ousia/luke
+ CoNLL
CoNLL 2003
Open Entity
ReCoRD
@@ -10400,6 +10403,7 @@
toshniwal-etal-2020-learning
shtoshni92/long-doc-coref
+ CoNLL
CoNLL-2012
OntoNotes 5.0
@@ -10414,6 +10418,7 @@
xu-choi-2020-revealing
lxucs/coref-hoi
+ CoNLL
CoNLL-2012
diff --git a/data/xml/2020.findings.xml b/data/xml/2020.findings.xml
index a2a5c5b77e..9c25e740aa 100644
--- a/data/xml/2020.findings.xml
+++ b/data/xml/2020.findings.xml
@@ -417,6 +417,7 @@
10.18653/v1/2020.findings-emnlp.28
chen-etal-2020-enhance
+ CoNLL
CoNLL 2003
CoNLL-2000
@@ -4408,6 +4409,7 @@
szymanski-etal-2020-wer
LibriSpeech
+ TED-LIUM
Detecting Stance in Media On Global Warming
@@ -5278,6 +5280,7 @@
2020.findings-emnlp.356
10.18653/v1/2020.findings-emnlp.356
wang-etal-2020-embeddings
+ CoNLL
CoNLL 2003
diff --git a/data/xml/2020.iwslt.xml b/data/xml/2020.iwslt.xml
index ecc137ab20..3e3ed98b70 100644
--- a/data/xml/2020.iwslt.xml
+++ b/data/xml/2020.iwslt.xml
@@ -75,7 +75,6 @@
elbayad-etal-2020-trac
How2
MuST-C
- TED-LIUM 3
Start-Before-End and End-to-End: Neural Speech Translation by AppTek and RWTH Aachen University
@@ -393,6 +392,7 @@
10.18653/v1/2020.iwslt-1.25
machacek-etal-2020-elitr
+ TED-LIUM
Is 42 the Answer to Everything in Subtitling-oriented Speech Translation?
diff --git a/data/xml/2020.lrec.xml b/data/xml/2020.lrec.xml
index 49fc8e8a0c..6cfa06cf53 100644
--- a/data/xml/2020.lrec.xml
+++ b/data/xml/2020.lrec.xml
@@ -52,6 +52,7 @@
eng
yu-etal-2020-cluster
juntaoy/dali-full-anaphora
+ CoNLL
CoNLL-2012
diff --git a/data/xml/2020.repl4nlp.xml b/data/xml/2020.repl4nlp.xml
index 9e278c20f0..ad843b81bd 100644
--- a/data/xml/2020.repl4nlp.xml
+++ b/data/xml/2020.repl4nlp.xml
@@ -33,6 +33,7 @@
10.18653/v1/2020.repl4nlp-1.1
liu-etal-2020-zero
+ CoNLL
CoNLL04
diff --git a/data/xml/2021.acl.xml b/data/xml/2021.acl.xml
index 4756787fb9..8b6ebe1041 100644
--- a/data/xml/2021.acl.xml
+++ b/data/xml/2021.acl.xml
@@ -2301,6 +2301,7 @@
modelscope/adaseq
BC5CDR
CMeEE
+ CoNLL
CoNLL 2003
CoNLL++
CoNLL-2000
@@ -3366,6 +3367,7 @@
wang-etal-2021-automated
Alibaba-NLP/ACE
+ CoNLL
CoNLL 2002
CoNLL 2003
CoNLL-2000
@@ -3527,6 +3529,7 @@
tricktreat/locate-and-label
ACE 2004
ACE 2005
+ CoNLL
CoNLL 2003
GENIA
Weibo NER
@@ -7340,6 +7343,7 @@
yhcc/BARTNER
ACE 2004
ACE 2005
+ CoNLL
CoNLL 2003
GENIA
OntoNotes 5.0
@@ -8330,6 +8334,7 @@
10.18653/v1/2021.acl-long.511
colombo-etal-2021-novel
+ Yelp
Determinantal Beam Search
@@ -9368,6 +9373,7 @@
kirstain-etal-2021-coreference
yuvalkirstain/s2e-coref
+ CoNLL
CoNLL-2012
GAP Coreference Dataset
@@ -10628,6 +10634,7 @@
google-research-datasets/clang8
AKCES-GEC
C4
+ CoNLL
CoNLL-2014 Shared Task: Grammatical Error Correction
FCE
mC4
diff --git a/data/xml/2021.eacl.xml b/data/xml/2021.eacl.xml
index 4147a71fd3..81b3e04927 100644
--- a/data/xml/2021.eacl.xml
+++ b/data/xml/2021.eacl.xml
@@ -584,6 +584,7 @@
10.18653/v1/2021.eacl-main.40
ManojPrabhakar/CHOLAN
AIDA CoNLL-YAGO
+ CoNLL
DBpedia
T-REx
diff --git a/data/xml/2021.emnlp.xml b/data/xml/2021.emnlp.xml
index c9b76fc9d2..d93d349157 100644
--- a/data/xml/2021.emnlp.xml
+++ b/data/xml/2021.emnlp.xml
@@ -4067,7 +4067,7 @@
zheng-etal-2021-allocating
10.18653/v1/2021.emnlp-main.257
- bozheng-hit/vocapxlm
+ bozheng-hit/vocapxlm
MLQA
PAWS-X
TyDiQA
@@ -6894,6 +6894,7 @@
10.18653/v1/2021.emnlp-main.437
wzhouad/NLL-IE
+ CoNLL
CoNLL 2003
CoNLL++
TACRED
@@ -9557,6 +9558,7 @@
nicola-decao/efficient-autoregressive-EL
AIDA CoNLL-YAGO
+ CoNLL
Word-Level Coreference Resolution
@@ -9568,6 +9570,7 @@
10.18653/v1/2021.emnlp-main.605
vdobrovolskii/wl-coref
+ CoNLL
CoNLL-2012
OntoNotes 5.0
@@ -9669,6 +9672,7 @@
10.18653/v1/2021.emnlp-main.611
michiyasunaga/LM-Critic
+ CoNLL
CoNLL-2014 Shared Task: Grammatical Error Correction
GMEG-wiki
GMEG-yahoo
@@ -11394,6 +11398,7 @@
IBM/yaso-tsa
YASO
SST
+ Yelp
An Empirical Study on Leveraging Position Embeddings for Target-oriented Opinion Words Extraction
diff --git a/data/xml/2021.findings.xml b/data/xml/2021.findings.xml
index 341626a997..46523985a2 100644
--- a/data/xml/2021.findings.xml
+++ b/data/xml/2021.findings.xml
@@ -735,6 +735,7 @@
10.18653/v1/2021.findings-acl.49
fei-etal-2021-better
scofield7419/hesyfu
+ CoNLL
CoNLL-2012
OntoNotes 5.0
@@ -9588,6 +9589,7 @@
10.18653/v1/2021.findings-emnlp.204
Adverse Drug Events (ADE) Corpus
+ CoNLL
CoNLL04
DocRED
New York Times Annotated Corpus
@@ -9822,6 +9824,7 @@
ACE 2004
AIDA CoNLL-YAGO
AQUAINT
+ CoNLL
KILT
YAGO
@@ -11433,6 +11436,7 @@
10.18653/v1/2021.findings-emnlp.328
megagonlabs/coop
+ Yelp
Using Optimal Transport as Alignment Objective for fine-tuning Multilingual Contextualized Embeddings
diff --git a/data/xml/2021.iwslt.xml b/data/xml/2021.iwslt.xml
index 2232a8db99..a38c70e558 100644
--- a/data/xml/2021.iwslt.xml
+++ b/data/xml/2021.iwslt.xml
@@ -122,7 +122,6 @@
bytedance/neurst
LibriSpeech
MuST-C
- TED-LIUM 3
THE IWSLT 2021 BUT SPEECH TRANSLATION SYSTEMS
@@ -183,6 +182,7 @@
inaguma-etal-2021-espnet
LibriSpeech
MuST-C
+ TED-LIUM
End-to-End Speech Translation with Pre-trained Models and Adapters: UPC at IWSLT 2021
@@ -235,7 +235,6 @@
How2
LibriSpeech
MuST-C
- TED-LIUM 3
FST: the FAIR Speech Translation System for the IWSLT21 Multilingual Shared Task
diff --git a/data/xml/2021.naacl.xml b/data/xml/2021.naacl.xml
index 48ad8a8d91..e285a0f27e 100644
--- a/data/xml/2021.naacl.xml
+++ b/data/xml/2021.naacl.xml
@@ -6603,6 +6603,7 @@
liu-etal-2021-neural
thunlp/VERNet
+ CoNLL
CoNLL-2014 Shared Task: Grammatical Error Correction
FCE
JFLEG
diff --git a/data/xml/2021.ranlp.xml b/data/xml/2021.ranlp.xml
index bb7d9cb690..f8b59a27dd 100644
--- a/data/xml/2021.ranlp.xml
+++ b/data/xml/2021.ranlp.xml
@@ -1884,6 +1884,7 @@
Nowadays, social media platforms use classification models to cope with hate speech and abusive language. The problem of these models is their vulnerability to bias. A prevalent form of bias in hate speech and abusive language datasets is annotator bias caused by the annotator’s subjective perception and the complexity of the annotation task. In our paper, we develop a set of methods to measure annotator bias in abusive language datasets and to identify different perspectives on abusive language. We apply these methods to four different abusive language datasets. Our proposed approach supports annotation processes of such datasets and future research addressing different perspectives on the perception of abusive language.
2021.ranlp-1.170
wich-etal-2021-investigating
+ mawic/annotator-bias-abusive-language
Rules Ruling Neural Networks - Neural vs. Rule-Based Grammar Checking for a Low Resource Language
diff --git a/data/xml/2022.acl.xml b/data/xml/2022.acl.xml
index d8964b9bd7..0b2ef6ad26 100644
--- a/data/xml/2022.acl.xml
+++ b/data/xml/2022.acl.xml
@@ -1103,6 +1103,7 @@
tricktreat/piqn
ACE 2004
ACE 2005
+ CoNLL
CoNLL 2003
Few-NERD
GENIA
@@ -5442,6 +5443,7 @@ in the Case of Unambiguous Gender
thunlp/pl-marker
ACE 2004
ACE 2005
+ CoNLL
CoNLL 2003
Few-NERD
OntoNotes 5.0
@@ -6891,6 +6893,7 @@ in the Case of Unambiguous Gender
JiachengLi1995/UCTopic
BC5CDR
CoNLL 2003
+ Google Local review
KP20k
KPTimes
WNUT 2017
@@ -7903,6 +7906,7 @@ in the Case of Unambiguous Gender
syuoni/eznlp
ACE 2004
ACE 2005
+ CoNLL
CoNLL 2003
CoNLL++
MSRA CN NER
diff --git a/data/xml/2022.coling.xml b/data/xml/2022.coling.xml
index c88dee98e8..77caed8c06 100644
--- a/data/xml/2022.coling.xml
+++ b/data/xml/2022.coling.xml
@@ -2548,6 +2548,7 @@
2022.coling-1.191
wang-etal-2022-mrc
shannonai/mrc-srl
+ CoNLL
OntoNotes 5.0
@@ -4948,6 +4949,7 @@
2022.coling-1.370
zhang-etal-2022-semantic
yzhangcs/crfsrl
+ CoNLL
CoNLL-2012
OntoNotes 5.0
diff --git a/data/xml/2022.findings.xml b/data/xml/2022.findings.xml
index ad968a6154..8ce376c705 100644
--- a/data/xml/2022.findings.xml
+++ b/data/xml/2022.findings.xml
@@ -1066,6 +1066,7 @@
cgraywang/deepstruct
ACE 2005
ATIS
+ CoNLL
CoNLL 2003
CoNLL++
CoNLL04
diff --git a/data/xml/2022.iwslt.xml b/data/xml/2022.iwslt.xml
index 28d386c363..136e4f4886 100644
--- a/data/xml/2022.iwslt.xml
+++ b/data/xml/2022.iwslt.xml
@@ -199,6 +199,7 @@
LibriSpeech
MuST-C
OpenSubtitles
+ TED-LIUM
VoxPopuli
@@ -358,7 +359,6 @@
wang-etal-2022-hw
10.18653/v1/2022.iwslt-1.20
LibriSpeech
- TED-LIUM 3
The HW-TSC’s Simultaneous Speech Translation System for IWSLT 2022 Evaluation
@@ -380,7 +380,6 @@
wang-etal-2022-hw-tscs
10.18653/v1/2022.iwslt-1.21
LibriSpeech
- TED-LIUM 3
MLLP-VRAIN UPV systems for the IWSLT 2022 Simultaneous Speech Translation and Speech-to-Speech Translation tasks
@@ -472,7 +471,6 @@
guo-etal-2022-hw
10.18653/v1/2022.iwslt-1.26
LibriSpeech
- TED-LIUM 3
CMU’s IWSLT 2022 Dialect Speech Translation System
diff --git a/data/xml/2022.lrec.xml b/data/xml/2022.lrec.xml
index 3b170fcff8..31c02f361e 100644
--- a/data/xml/2022.lrec.xml
+++ b/data/xml/2022.lrec.xml
@@ -9553,6 +9553,7 @@
2022.lrec-1.772
tian-etal-2022-syntax
synlp/srl-mm
+ CoNLL
OntoNotes 5.0
diff --git a/data/xml/2022.naacl.xml b/data/xml/2022.naacl.xml
index e4bc0a1e5e..d2d2d3891b 100644
--- a/data/xml/2022.naacl.xml
+++ b/data/xml/2022.naacl.xml
@@ -3383,6 +3383,7 @@
ACE 2004
AIDA CoNLL-YAGO
AQUAINT
+ CoNLL
DocRED
@@ -3870,6 +3871,7 @@
ACE 2004
AIDA CoNLL-YAGO
AQUAINT
+ CoNLL
Clues Before Answers: Generation-Enhanced Multiple-Choice QA
@@ -5463,7 +5465,7 @@
2022.naacl-main.332
verma-etal-2022-chai
10.18653/v1/2022.naacl-main.332
- siddharthverma314/chai-naacl-2022
+ siddharthverma314/chai-naacl-2022
Connecting the Dots between Audio and Text without Parallel Data through Visual Knowledge Transfer
@@ -8409,6 +8411,7 @@
ACE 2004
AIDA CoNLL-YAGO
AQUAINT
+ CoNLL
IPM NEL
WebQuestionsSP
diff --git a/data/xml/2022.rocling.xml b/data/xml/2022.rocling.xml
index 61c860874f..4eb324047b 100644
--- a/data/xml/2022.rocling.xml
+++ b/data/xml/2022.rocling.xml
@@ -290,7 +290,6 @@
wu-etal-2022-preliminary
zho
LibriSpeech
- TED-LIUM 3
Clustering Issues in Civil Judgments for Recommending Similar Cases
@@ -522,6 +521,7 @@
2022.rocling-1.42
luo-etal-2022-ynu
zho
+ suntea233/ROCLING-2022
NERVE at ROCLING 2022 Shared Task: A Comparison of Three Named Entity Recognition Frameworks Based on Language Model and Lexicon Approach
diff --git a/data/xml/C18.xml b/data/xml/C18.xml
index c44572fb27..d8741c2bc9 100644
--- a/data/xml/C18.xml
+++ b/data/xml/C18.xml
@@ -1577,6 +1577,7 @@
Recent advances in language modeling using recurrent neural networks have made it viable to model language as distributions over characters. By learning to predict the next character on the basis of previous characters, such models have been shown to automatically internalize linguistic concepts such as words, sentences, subclauses and even sentiment. In this paper, we propose to leverage the internal states of a trained character language model to produce a novel type of word embedding which we refer to as contextual string embeddings. Our proposed embeddings have the distinct properties that they (a) are trained without any explicit notion of words and thus fundamentally model words as sequences of characters, and (b) are contextualized by their surrounding text, meaning that the same word will have different embeddings depending on its contextual use. We conduct a comparative evaluation against previous embeddings and find that our embeddings are highly useful for downstream tasks: across four classic sequence labeling tasks we consistently outperform the previous state-of-the-art. In particular, we significantly outperform previous work on English and German named entity recognition (NER), allowing us to report new state-of-the-art F1-scores on the CoNLL03 shared task. We release all code and pre-trained language models in a simple-to-use framework to the research community, to enable reproduction of these experiments and application of our proposed embeddings to other tasks: https://github.com/zalandoresearch/flair
C18-1139
akbik-etal-2018-contextual
+ CoNLL
CoNLL 2003
CoNLL-2000
Penn Treebank
@@ -1762,6 +1763,7 @@
lukecq1231/generalized-pooling
MultiNLI
SNLI
+ Yelp
Treat us like the sequences we are: Prepositional Paraphrasing of Noun Compounds using LSTM
@@ -1841,6 +1843,7 @@
Neural network approaches to Named-Entity Recognition reduce the need for carefully hand-crafted features. While some features do remain in state-of-the-art systems, lexical features have been mostly discarded, with the exception of gazetteers. In this work, we show that this is unfair: lexical features are actually quite useful. We propose to embed words and entity types into a low-dimensional vector space we train from annotated data produced by distant supervision thanks to Wikipedia. From this, we compute — offline — a feature vector representing each word. When used with a vanilla recurrent neural network model, this representation yields substantial improvements. We establish a new state-of-the-art F1 score of 87.95 on ONTONOTES 5.0, while matching state-of-the-art performance with a F1 score of 91.73 on the over-studied CONLL-2003 dataset.
C18-1161
ghaddar-langlais-2018-robust
+ CoNLL
CoNLL 2003
DBpedia
OntoNotes 5.0
@@ -2887,6 +2890,7 @@
C18-1250
yu-liu-2018-sliced
zepingyu0512/srnn
+ Yelp
Multi-Task Learning for Sequence Tagging: An Empirical Study
diff --git a/data/xml/D11.xml b/data/xml/D11.xml
index 3f3ab018e1..bfaf60b1cd 100644
--- a/data/xml/D11.xml
+++ b/data/xml/D11.xml
@@ -691,6 +691,7 @@
D11-1072
hoffart-etal-2011-robust
AIDA CoNLL-YAGO
+ CoNLL
A Cascaded Classification Approach to Semantic Head Recognition
diff --git a/data/xml/D14.xml b/data/xml/D14.xml
index 502596948b..4ade3a66a9 100644
--- a/data/xml/D14.xml
+++ b/data/xml/D14.xml
@@ -2126,6 +2126,7 @@
D14-1200
10.3115/v1/D14-1200
miwa-sasaki-2014-modeling
+ CoNLL
CoNLL04
diff --git a/data/xml/D17.xml b/data/xml/D17.xml
index 905c0f53f8..3b1d2d0053 100644
--- a/data/xml/D17.xml
+++ b/data/xml/D17.xml
@@ -266,6 +266,7 @@
lee-etal-2017-end
kentonl/e2e-coref
+ CoNLL
CoNLL-2012
OntoNotes 5.0
@@ -2052,6 +2053,7 @@ and the code is available at https://github.com/qizhex/RACE_AR_baselines
marcheggiani-titov-2017-encoding
diegma/neural-dep-srl
+ CoNLL
CoNLL-2009
@@ -2335,6 +2337,7 @@ and the code is available at https://github.com/qizhex/RACE_AR_baselines
Neural networks have shown promising results for relation extraction. State-of-the-art models cast the task as an end-to-end problem, solved incrementally using a local classifier. Yet previous work using statistical models have demonstrated that global optimization can achieve better performances compared to local classification. We build a globally optimized neural model for end-to-end relation extraction, proposing novel LSTM features in order to better learn context representations. In addition, we present a novel method to integrate syntactic information to facilitate global learning, yet requiring little background on syntactic grammars thus being easy to extend. Experimental results show that our proposed model is highly effective, achieving the best performances on two standard benchmarks.
zhang-etal-2017-end
ACE 2005
+ CoNLL
CoNLL04
@@ -3551,6 +3554,7 @@ and efficiency of on-line policy optimization compared to other companion
ACE 2004
AIDA CoNLL-YAGO
AQUAINT
+ CoNLL
MinIE: Minimizing Facts in Open Information Extraction
@@ -3587,8 +3591,8 @@ and efficiency of on-line policy optimization compared to other companion
10.18653/v1/D17-1280
In domain-specific NER, due to insufficient labeled training data, deep models usually fail to behave normally. In this paper, we proposed a novel Neural Inductive TEaching framework (NITE) to transfer knowledge from existing domain-specific NER models into an arbitrary deep neural network in a teacher-student training manner. NITE is a general framework that builds upon transfer learning and multiple instance learning, which collaboratively not only transfers knowledge to a deep student network but also reduces the noise from teachers. NITE can help deep learning methods to effectively utilize existing resources (i.e., models, labeled and unlabeled data) in a small domain. The experiment resulted on Disease NER proved that without using any labeled data, NITE can significantly boost the performance of a CNN-bidirectional LSTM-CRF NER neural network nearly over 30% in terms of F1-score.
tang-etal-2017-nite
+ NCBI Datasets
NCBI Disease
- NCBI Disease Corpus
Speeding up Reinforcement Learning-based Information Extraction Training using Asynchronous Methods
diff --git a/data/xml/D18.xml b/data/xml/D18.xml
index 1aaa19c42a..2d06a8d265 100644
--- a/data/xml/D18.xml
+++ b/data/xml/D18.xml
@@ -326,6 +326,7 @@
10.18653/v1/D18-1020
chen-etal-2018-variational
mingdachen/vsl
+ CoNLL
CoNLL 2003
@@ -2077,6 +2078,7 @@
10.18653/v1/D18-1153
liu-etal-2018-efficient
LiyuanLucasLiu/LD-Net
+ CoNLL
CoNLL 2003
@@ -2627,6 +2629,7 @@
10.18653/v1/D18-1191
ouchi-etal-2018-span
hiroki13/span-based-srl
+ CoNLL
OntoNotes 5.0
@@ -2891,6 +2894,7 @@
shen-etal-2018-learning
DBpedia
WikiQA
+ Yelp
Deep Relevance Ranking Using Enhanced Document-Query Interactions
@@ -2983,6 +2987,7 @@
clark-etal-2018-semi
CCGbank
+ CoNLL
CoNLL 2003
OntoNotes 5.0
Penn Treebank
@@ -3831,6 +3836,7 @@
10.18653/v1/D18-1274
chollampatt-ng-2018-neural
nusnlp/neuqe
+ CoNLL
CoNLL-2014 Shared Task: Grammatical Error Correction
FCE
JFLEG
@@ -3902,6 +3908,7 @@
Character-based neural models have recently proven very useful for many NLP tasks. However, there is a gap of sophistication between methods for learning representations of sentences and words. While, most character models for learning representations of sentences are deep and complex, models for learning representations of words are shallow and simple. Also, in spite of considerable research on learning character embeddings, it is still not clear which kind of architecture is the best for capturing character-to-word representations. To address these questions, we first investigate the gaps between methods for learning word and sentence representations. We conduct detailed experiments and comparisons on different state-of-the-art convolutional models, and also investigate the advantages and disadvantages of their constituents. Furthermore, we propose IntNet, a funnel-shaped wide convolutional neural architecture with no down-sampling for learning representations of the internal structure of words by composing their characters from limited, supervised training corpora. We evaluate our proposed model on six sequence labeling datasets, including named entity recognition, part-of-speech tagging, and syntactic chunking. Our in-depth analysis shows that IntNet significantly outperforms other character embedding models and obtains new state-of-the-art performance without relying on any external knowledge or resources.
10.18653/v1/D18-1279
xin-etal-2018-learning
+ CoNLL
CoNLL 2003
Penn Treebank
@@ -4277,6 +4284,7 @@
bekou/multihead_joint_entity_relation_extraction
ACE 2004
Adverse Drug Events (ADE) Corpus
+ CoNLL
CoNLL04
@@ -4319,6 +4327,7 @@
10.18653/v1/D18-1310
wu-etal-2018-evaluating
minghao-wu/CRF-AE
+ CoNLL
CoNLL 2003
@@ -7575,6 +7584,7 @@
10.18653/v1/D18-1548
strubell-etal-2018-linguistically
strubell/LISA
+ CoNLL
CoNLL-2012
diff --git a/data/xml/D19.xml b/data/xml/D19.xml
index 3b0a80a8a8..bf538d90f9 100644
--- a/data/xml/D19.xml
+++ b/data/xml/D19.xml
@@ -88,6 +88,7 @@
peters-etal-2019-knowledge
allenai/kb
AIDA CoNLL-YAGO
+ CoNLL
SemEval-2010 Task-8
TACRED
WiC
@@ -401,6 +402,7 @@
yang-etal-2019-learning
YoungXiyuan/DCA
AIDA CoNLL-YAGO
+ CoNLL
Open Event Extraction from Online Text using a Generative Adversarial Network
@@ -1089,6 +1091,7 @@
10.18653/v1/D19-1077
wu-dredze-2019-beto
shijie-wu/crosslingual-nlp
+ CoNLL
CoNLL 2002
MLDoc
XNLI
@@ -1672,6 +1675,7 @@
10.18653/v1/D19-1119
kiyono-etal-2019-empirical
butsugiri/gec-pseudodata
+ CoNLL
CoNLL-2014 Shared Task: Grammatical Error Correction
JFLEG
WI-LOCNESS
@@ -5090,6 +5094,7 @@
10.18653/v1/D19-1367
jiang-etal-2019-improved
jiangyingjunn/i-darts
+ CoNLL
CoNLL 2003
PTB Diagnostic ECG Database
@@ -5527,6 +5532,7 @@
10.18653/v1/D19-1399
jie-lu-2019-dependency
allanj/ner_with_dependency
+ CoNLL
CoNLL 2003
OntoNotes 5.0
@@ -5620,6 +5626,7 @@
D19-1406
10.18653/v1/D19-1406
tikhonov-etal-2019-style
+ Yelp
Yelp Review Polarity
@@ -5769,6 +5776,7 @@
AG News
DBpedia
Yahoo! Answers
+ Yelp
Don’t Take the Easy Way Out: Ensemble Based Methods for Avoiding Known Dataset Biases
@@ -6029,6 +6037,7 @@
D19-1435.Attachment.pdf
10.18653/v1/D19-1435
awasthi-etal-2019-parallel
+ CoNLL
CoNLL-2014 Shared Task: Grammatical Error Correction
JFLEG
@@ -7189,6 +7198,7 @@
wang-etal-2019-crossweigh
ZihanWangKi/CrossWeigh
CoNLL++
+ CoNLL
CoNLL 2003
WNUT 2017
@@ -7482,6 +7492,7 @@
D19-1539
10.18653/v1/D19-1539
baevski-etal-2019-cloze
+ CoNLL
CoNLL 2003
GLUE
MRPC
@@ -8161,6 +8172,7 @@
10.18653/v1/D19-1588
joshi-etal-2019-bert
mandarjoshi90/coref
+ CoNLL
CoNLL-2012
GAP Coreference Dataset
OntoNotes 5.0
diff --git a/data/xml/E17.xml b/data/xml/E17.xml
index 169fb1720d..7f30040ccb 100644
--- a/data/xml/E17.xml
+++ b/data/xml/E17.xml
@@ -2076,6 +2076,7 @@
DBpedia
YFCC100M
Yahoo! Answers
+ Yelp
Pulling Out the Stops: Rethinking Stopword Removal for Topic Models
diff --git a/data/xml/K16.xml b/data/xml/K16.xml
index 374436a831..7b0a012cfc 100644
--- a/data/xml/K16.xml
+++ b/data/xml/K16.xml
@@ -284,6 +284,7 @@
10.18653/v1/K16-1025
yamada-etal-2016-joint
AIDA CoNLL-YAGO
+ CoNLL
TAC 2010
diff --git a/data/xml/K18.xml b/data/xml/K18.xml
index eea5560d7a..e95b12d41e 100644
--- a/data/xml/K18.xml
+++ b/data/xml/K18.xml
@@ -635,6 +635,7 @@
kolitsas-etal-2018-end
dalab/end2end_neural_el
AIDA CoNLL-YAGO
+ CoNLL
IPM NEL
diff --git a/data/xml/K19.xml b/data/xml/K19.xml
index 85cf92a38c..8c8d8caf0c 100644
--- a/data/xml/K19.xml
+++ b/data/xml/K19.xml
@@ -835,6 +835,7 @@
broscheit-2019-investigating
samuelbroscheit/entity_knowledge_in_bert
AIDA CoNLL-YAGO
+ CoNLL
GLUE
SWAG
@@ -1345,6 +1346,7 @@
K19-2002.Attachment.zip
10.18653/v1/K19-2002
hershcovich-arviv-2019-tupa
+ CoNLL
The ERG at MRP 2019: Radically Compositional Semantic Dependencies
@@ -1414,6 +1416,7 @@
K19-2007.Attachment.pdf
10.18653/v1/K19-2007
che-etal-2019-hit
+ CoNLL
SJTU at MRP 2019: A Transition-Based Multi-Task Parser for Cross-Framework Meaning Representation Parsing
diff --git a/data/xml/L16.xml b/data/xml/L16.xml
index 397ff95d1c..e21d23cab4 100644
--- a/data/xml/L16.xml
+++ b/data/xml/L16.xml
@@ -6376,7 +6376,7 @@
We present the first version of a corpus annotated for psychiatric disorders and their etiological factors. The paper describes the choice of text, annotated entities and events/relations as well as the annotation scheme and procedure applied. The corpus is featuring a selection of focus psychiatric disorders including depressive disorder, anxiety disorder, obsessive-compulsive disorder, phobic disorders and panic disorder. Etiological factors for these focus disorders are widespread and include genetic, physiological, sociological and environmental factors among others. Etiological events, including annotated evidence text, represent the interactions between their focus disorders and their etiological factors. Additionally to these core events, symptomatic and treatment events have been annotated. The current version of the corpus includes 175 scientific abstracts. All entities and events/relations have been manually annotated by domain experts and scores of inter-annotator agreement are presented. The aim of the corpus is to provide a first gold standard to support the development of biomedical text mining applications for the specific area of mental disorders which belong to the main contributors to the contemporary burden of disease.
L16-1590
ellendorff-etal-2016-psymine
- NCBI Disease Corpus
+ NCBI Datasets
An Empirical Exploration of Moral Foundations Theory in Partisan News Sources
diff --git a/data/xml/N16.xml b/data/xml/N16.xml
index a345f0aaf5..aa20ca43a4 100644
--- a/data/xml/N16.xml
+++ b/data/xml/N16.xml
@@ -356,6 +356,7 @@
10.18653/v1/N16-1030
lample-etal-2016-neural
glample/tagger
+ CoNLL
CoNLL 2003
CoNLL++
diff --git a/data/xml/N18.xml b/data/xml/N18.xml
index d469910e03..fa3c74be44 100644
--- a/data/xml/N18.xml
+++ b/data/xml/N18.xml
@@ -761,6 +761,7 @@
junczys-dowmunt-etal-2018-approaching
grammatical/neural-naacl2018
+ CoNLL
CoNLL-2014 Shared Task: Grammatical Error Correction
FCE
JFLEG
@@ -1224,6 +1225,7 @@
10.18653/v1/N18-1089
yasunaga-etal-2018-robust
michiyasunaga/pos_adv
+ CoNLL
CoNLL 2003
CoNLL-2000
Penn Treebank
@@ -2271,6 +2273,7 @@
radhakrishnan-etal-2018-elden
AIDA CoNLL-YAGO
+ CoNLL
Interpretable Charge Predictions for Criminal Cases: Learning to Generate Court Views from Fact Descriptions
@@ -2301,6 +2304,7 @@
li-etal-2018-delete
lijuncen/Sentiment-and-Style-Transfer
GYAFC
+ Yelp
Yelp2018
@@ -2735,6 +2739,7 @@
peters-etal-2018-deep
ACL ARC
+ CoNLL
CoNLL 2003
CoNLL++
OCW
@@ -3370,6 +3375,7 @@
10.18653/v1/N18-2046
grundkiewicz-junczys-dowmunt-2018-near
+ CoNLL
CoNLL-2014 Shared Task: Grammatical Error Correction
JFLEG
@@ -4169,6 +4175,7 @@
lee-etal-2018-higher
kentonl/e2e-coref
+ CoNLL
CoNLL-2012
OntoNotes 5.0
@@ -4280,6 +4287,7 @@
N18-2117
10.18653/v1/N18-2117
al-hanai-etal-2018-role
+ TED-LIUM
Slot-Gated Modeling for Joint Slot Filling and Intent Prediction
diff --git a/data/xml/N19.xml b/data/xml/N19.xml
index fb0bb93939..9ac30aa2a4 100644
--- a/data/xml/N19.xml
+++ b/data/xml/N19.xml
@@ -205,6 +205,7 @@
zhao-etal-2019-improving
zhawe01/fairseq-gec
Billion Word Benchmark
+ CoNLL
CoNLL-2014 Shared Task: Grammatical Error Correction
FCE
JFLEG
@@ -5556,6 +5557,7 @@
adhikari-etal-2019-rethinking
IMDB-MULTI
Reuters-21578
+ Yelp
Pre-trained language model representations for language generation
@@ -5777,6 +5779,7 @@
google-research/bert
CPED
CoLA
+ CoNLL
CoNLL 2003
CoQA
DBpedia
diff --git a/data/xml/P16.xml b/data/xml/P16.xml
index 45cd71b02e..8c0b12fd3e 100644
--- a/data/xml/P16.xml
+++ b/data/xml/P16.xml
@@ -1139,6 +1139,7 @@
10.18653/v1/P16-1101
ma-hovy-2016-end
+ CoNLL
CoNLL 2003
CoNLL++
Penn Treebank
@@ -1260,6 +1261,7 @@
P16-1112
10.18653/v1/P16-1112
rei-yannakoudakis-2016-compositional
+ CoNLL
FCE
@@ -1271,6 +1273,7 @@
10.18653/v1/P16-1113
roth-lapata-2016-neural
microth/PathLSTM
+ CoNLL
CoNLL-2009
@@ -2586,6 +2589,7 @@
P16-1228.Notes.pdf
hu-etal-2016-harnessing
+ CoNLL
CoNLL 2003
SST
SST-2
diff --git a/data/xml/P17.xml b/data/xml/P17.xml
index dae14c93c3..afa964dff4 100644
--- a/data/xml/P17.xml
+++ b/data/xml/P17.xml
@@ -628,6 +628,7 @@ two word-vectors results in a vector that is only a small angle away from the ve
he-etal-2017-deep
luheng/deep_srl
+ CoNLL
OntoNotes 5.0
@@ -744,6 +745,7 @@ two word-vectors results in a vector that is only a small angle away from the ve
johnson-zhang-2017-deep
AG News
DBpedia
+ Yelp
Improved Neural Relation Detection for Knowledge Base Question Answering
@@ -1292,6 +1294,7 @@ two word-vectors results in a vector that is only a small angle away from the ve
iyer-etal-2017-learning
ATIS
IMDb Movie Reviews
+ Yelp
Joint Modeling of Content and Discourse Relations in Dialogues
@@ -2253,6 +2256,7 @@ two word-vectors results in a vector that is only a small angle away from the ve
Pre-trained word embeddings learned from unlabeled text have become a standard component of neural network architectures for NLP tasks. However, in most cases, the recurrent network that operates on word-level representations to produce context sensitive representations is trained on relatively little labeled data. In this paper, we demonstrate a general semi-supervised approach for adding pretrained context embeddings from bidirectional language models to NLP systems and apply it to sequence labeling tasks. We evaluate our model on two standard datasets for named entity recognition (NER) and chunking, and in both cases achieve state of the art results, surpassing previous systems that use other forms of transfer or joint learning with additional labeled data and task specific gazetteers.
peters-etal-2017-semi
+ CoNLL
CoNLL 2003
@@ -2716,6 +2720,7 @@ two word-vectors results in a vector that is only a small angle away from the ve
We propose a sequence labeling framework with a secondary training objective, learning to predict surrounding words for every word in the dataset. This language modeling objective incentivises the system to learn general-purpose patterns of semantic and syntactic composition, which are also useful for improving accuracy on different sequence labeling tasks. The architecture was evaluated on a range of datasets, covering the tasks of error detection in learner texts, named entity recognition, chunking and POS-tagging. The novel language modeling objective provided consistent performance improvements on every benchmark, without requiring any additional annotated or unannotated data.
rei-2017-semi
marekrei/sequence-labeler
+ CoNLL
CoNLL 2003
FCE
Penn Treebank
diff --git a/data/xml/P18.xml b/data/xml/P18.xml
index 88205c5934..30390d5d12 100644
--- a/data/xml/P18.xml
+++ b/data/xml/P18.xml
@@ -483,6 +483,7 @@
P18-1030.Poster.pdf
10.18653/v1/P18-1030
zhang-etal-2018-sentence
+ CoNLL
CoNLL 2003
IMDb Movie Reviews
MR
@@ -504,6 +505,7 @@
IMDb Movie Reviews
WikiText-103
WikiText-2
+ Yelp
Evaluating neural network explanation methods using hybrid documents and morphosyntactic agreement
@@ -538,6 +540,7 @@
ATIS
IMDb Movie Reviews
WikiSQL
+ Yelp
Semantic Parsing with Syntax- and Table-Aware SQL Generation
@@ -664,6 +667,7 @@
shen-etal-2018-baseline
dinghanshen/SWEM
AG News
+ CoNLL
CoNLL 2003
CoNLL-2000
DBpedia
@@ -677,6 +681,7 @@
SUBJ
WikiQA
Yahoo! Answers
+ Yelp
ParaNMT-50M: Pushing the Limits of Paraphrastic Sentence Embeddings with Millions of Machine Translations
@@ -1219,6 +1224,7 @@
prabhumoye-etal-2018-style
shrimai/Style-Transfer-Through-Back-Translation
GYAFC
+ Yelp
Generating Fine-Grained Open Vocabulary Entity Type Descriptions
@@ -1375,6 +1381,7 @@
xu-etal-2018-unpaired
lancopku/unpaired-sentiment-translation
GYAFC
+ Yelp
Discourse Marker Augmented Network with Reinforcement Learning for Natural Language Inference
@@ -3253,6 +3260,7 @@
AG News
DBpedia
Yahoo! Answers
+ Yelp
Joint Embedding of Words and Labels for Text Classification
@@ -3274,6 +3282,7 @@
AG News
DBpedia
Yahoo! Answers
+ Yelp
Neural Sparse Topical Coding
@@ -4397,6 +4406,7 @@
10.18653/v1/P18-2038
ye-ling-2018-hybrid
ZhixiuYe/HSCRF-pytorch
+ CoNLL
CoNLL 2003
@@ -4665,6 +4675,7 @@
10.18653/v1/P18-2058
he-etal-2018-jointly
luheng/lsgn
+ CoNLL
CoNLL-2012
OntoNotes 5.0
@@ -6047,6 +6058,7 @@
10.18653/v1/P18-4013
yang-zhang-2018-ncrf
jiesutd/NCRFpp
+ CoNLL
CoNLL 2003
Penn Treebank
diff --git a/data/xml/P19.xml b/data/xml/P19.xml
index 7df677e1ea..b17c8aab5d 100644
--- a/data/xml/P19.xml
+++ b/data/xml/P19.xml
@@ -877,6 +877,7 @@
P19-1064
10.18653/v1/P19-1064
fei-etal-2019-end
+ CoNLL
CoNLL-2012
OntoNotes 5.0
@@ -904,6 +905,7 @@
P19-1066
10.18653/v1/P19-1066
kantor-globerson-2019-coreference
+ CoNLL
CoNLL-2012
OntoNotes 5.0
@@ -1819,6 +1821,7 @@
li-etal-2019-entity
ACE 2004
ACE 2005
+ CoNLL
CoNLL04
@@ -1955,6 +1958,7 @@
xia-etal-2019-multi
ACE 2004
ACE 2005
+ CoNLL
CoNLL 2003
@@ -2667,6 +2671,7 @@
le-titov-2019-boosting
lephong/wnel
AIDA CoNLL-YAGO
+ CoNLL
Pre-Learning Environment Representations for Data-Efficient Neural Instruction Following
@@ -3344,6 +3349,7 @@
10.18653/v1/P19-1233
liu-etal-2019-gcdt
Adaxry/GCDT
+ CoNLL
CoNLL 2003
@@ -4256,6 +4262,7 @@
10.18653/v1/P19-1299
chen-etal-2019-multi-source
microsoft/Multilingual-Model-Transfer
+ CoNLL
Unsupervised Multilingual Word Embedding with Limited Resources using Neural Language Models
@@ -7440,6 +7447,7 @@
10.18653/v1/P19-1524
liu-etal-2019-towards
lyutyuh/acl19_subtagger
+ CoNLL
CoNLL 2003
OntoNotes 5.0
@@ -7478,6 +7486,7 @@
strakova-etal-2019-neural
ACE 2004
ACE 2005
+ CoNLL
CoNLL 2002
CoNLL 2003
GENIA
@@ -7545,6 +7554,7 @@
P19-1532
10.18653/v1/P19-1532
liu-etal-2019-prism
+ CoNLL
CoNLL 2003
@@ -9611,6 +9621,7 @@
10.18653/v1/P19-2026
martins-etal-2019-joint
AIDA CoNLL-YAGO
+ CoNLL
CoNLL 2003
diff --git a/data/xml/Q16.xml b/data/xml/Q16.xml
index dd1f84fb1f..eec0a814ad 100644
--- a/data/xml/Q16.xml
+++ b/data/xml/Q16.xml
@@ -327,6 +327,7 @@
Q16-1026
chiu-nichols-2016-named
+ CoNLL
CoNLL 2003
DBpedia
OntoNotes 5.0
diff --git a/data/xml/Q17.xml b/data/xml/Q17.xml
index af092ee261..5608fcd500 100644
--- a/data/xml/Q17.xml
+++ b/data/xml/Q17.xml
@@ -392,6 +392,7 @@
yamada-etal-2017-learning
studio-ousia/ntee
AIDA CoNLL-YAGO
+ CoNLL
SICK
TAC 2010
diff --git a/data/xml/S14.xml b/data/xml/S14.xml
index bd5db1a7ab..3708e5a45b 100644
--- a/data/xml/S14.xml
+++ b/data/xml/S14.xml
@@ -469,7 +469,7 @@
S14-2019
10.3115/v1/S14-2019
matos-etal-2014-bioinformaticsua
- NCBI Disease Corpus
+ NCBI Datasets
Blinov: Distributed Representations of Words for Aspect-Based Sentiment Analysis at SemEval 2014
diff --git a/data/xml/W12.xml b/data/xml/W12.xml
index 2ef3347f30..aee10efe94 100644
--- a/data/xml/W12.xml
+++ b/data/xml/W12.xml
@@ -3437,7 +3437,6 @@
91–99
W12-2411
islamaj-dogan-lu-2012-improved
- NCBI Disease Corpus
New Resources and Perspectives for Biomedical Event Extraction
diff --git a/data/xml/W14.xml b/data/xml/W14.xml
index 2bafba5936..ce6666d790 100644
--- a/data/xml/W14.xml
+++ b/data/xml/W14.xml
@@ -6029,8 +6029,8 @@
W14-3404
10.3115/v1/W14-3404
leaman-lu-2014-automated
+ NCBI Datasets
NCBI Disease
- NCBI Disease Corpus
Decomposing Consumer Health Questions
diff --git a/data/xml/W17.xml b/data/xml/W17.xml
index bf834b9796..c30c213c61 100644
--- a/data/xml/W17.xml
+++ b/data/xml/W17.xml
@@ -9875,6 +9875,7 @@ is able to handle phenomena related to scope by means of an higher-order type th
10.18653/v1/W17-5004
We investigate the utility of different auxiliary objectives and training strategies within a neural sequence labeling approach to error detection in learner writing. Auxiliary costs provide the model with additional linguistic information, allowing it to learn general-purpose compositional features that can then be exploited for other objectives. Our experiments show that a joint learning approach trained with parallel labels on in-domain data improves performance over the previous best error detection system. While the resulting model has the same number of parameters, the additional objectives allow it to be optimised more efficiently and achieve better performance.
rei-yannakoudakis-2017-auxiliary
+ CoNLL
CoNLL 2003
FCE
@@ -10206,6 +10207,7 @@ is able to handle phenomena related to scope by means of an higher-order type th
10.18653/v1/W17-5032
Shortage of available training data is holding back progress in the area of automated error detection. This paper investigates two alternative methods for artificially generating writing errors, in order to create additional resources. We propose treating error generation as a machine translation task, where grammatically correct text is translated to contain errors. In addition, we explore a system for extracting textual patterns from an annotated corpus, which can then be used to insert errors into grammatically correct sentences. Our experiments show that the inclusion of artificially generated errors significantly improves error detection accuracy on both FCE and CoNLL 2014 datasets.
rei-etal-2017-artificial
+ CoNLL
FCE
diff --git a/data/xml/W18.xml b/data/xml/W18.xml
index 780f93653c..b1383c162a 100644
--- a/data/xml/W18.xml
+++ b/data/xml/W18.xml
@@ -10969,7 +10969,7 @@
tourille-etal-2018-evaluation
strayMat/bio-medical_ner
CoNLL 2003
- NCBI Disease Corpus
+ NCBI Datasets
Learning to Summarize Radiology Findings
diff --git a/data/xml/W19.xml b/data/xml/W19.xml
index 70071e390d..e15fa497a6 100644
--- a/data/xml/W19.xml
+++ b/data/xml/W19.xml
@@ -14138,6 +14138,7 @@ One of the references was wrong therefore it is corrected to cite the appropriat
W19-5945
10.18653/v1/W19-5945
keizer-etal-2019-user
+ skeizer/madrigal
Dialogue Act Classification in Team Communication for Robot Assisted Disaster Response