From 06308c8ba0bb345ab2c4c4c3b6f29220867cca9d Mon Sep 17 00:00:00 2001 From: Anthony Platanios Date: Sat, 13 Jan 2024 15:20:23 -0800 Subject: [PATCH] Added DOI information. --- _bibliography/papers.bib | 50 +++++++++++++++++++++++++++------------ _layouts/default.html | 3 +++ _layouts/publication.html | 10 ++++++++ 3 files changed, 48 insertions(+), 15 deletions(-) diff --git a/_bibliography/papers.bib b/_bibliography/papers.bib index a0e449fc2abf..3fb921d1bc6a 100644 --- a/_bibliography/papers.bib +++ b/_bibliography/papers.bib @@ -10,6 +10,7 @@ @inproceedings{StengelEskin:2022:troubling_quirk abstract = {In natural language understanding (NLU) production systems, users' evolving needs necessitate the addition of new features over time, indexed by new symbols added to the meaning representation space. This requires additional training data and results in ever-growing datasets. We present the first systematic investigation into this incremental symbol learning scenario. Our analyses reveal a troubling quirk in building (broad-coverage) NLU systems: as the training dataset grows, more data is needed to learn new symbols, forming a vicious cycle. We show that this trend holds for multiple mainstream models on two common NLU tasks: intent recognition and semantic parsing. Rejecting class imbalance as the sole culprit, we reveal that the trend is closely associated with an effect we call source signal dilution, where strong lexical cues for the new symbol become diluted as the training dataset grows. Selectively dropping training examples to prevent dilution often reverses the trend, showing the over-reliance of mainstream neural NLU models on simple lexical cues and their lack of contextual understanding.}, pdf = {stengel_eskin_2022_troubling_quirk/paper.pdf}, code = {https://github.com/microsoft/nlu-incremental-symbol-learning}, + doi = {10.18653/v1/2022.emnlp-main.789}, } @inproceedings{Zhou:2022:online_parsing, @@ -23,6 +24,7 @@ @inproceedings{Zhou:2022:online_parsing pdf = {zhou_2022_online_parsing/paper.pdf}, code = {https://github.com/microsoft/online-semantic-parsing-for-latency-reduction}, note = {{Outstanding Paper Award}}, + doi = {10.18653/v1/2022.acl-long.110}, } @inproceedings{Chen:2022:text_to_sql, @@ -35,6 +37,7 @@ @inproceedings{Chen:2022:text_to_sql abstract = {Text-to-SQL parsers map natural language questions to programs that are executable over tables to generate answers, and are typically evaluated on large-scale datasets like Spider (Yu et al., 2018). We argue that existing benchmarks fail to capture a certain out-of-domain generalization problem that is of significant practical importance: matching domain specific phrases to composite operation over columns. To study this problem, we first propose a synthetic dataset along with a re-purposed train/test split of the Squall dataset (Shi et al., 2020) as new benchmarks to quantify domain generalization over column operations, and find existing state-of-the-art parsers struggle in these benchmarks. We propose to address this problem by incorporating prior domain knowledge by preprocessing table schemas, and design a method that consists of two components: schema expansion and schema pruning. 
This method can be easily applied to multiple existing base parsers, and we show that it significantly outperforms baseline parsers on this domain generalization problem, boosting the underlying parsers’ overall performance by up to 13.8% relative accuracy gain (5.1% absolute) on the new Squall data split.}, pdf = {chen_2022_text_to_sql/paper.pdf}, code = {https://github.com/microsoft/text-to-sql-schema-expansion-generalization}, + doi = {10.18653/v1/2022.acl-long.381}, } @inproceedings{Belyy:2022:k_best, @@ -46,6 +49,7 @@ @inproceedings{Belyy:2022:k_best year = {2022}, abstract = {Collecting data for conversational semantic parsing is a time-consuming and demanding process. In this paper we consider, given an incomplete dataset with only a small amount of data, how to build an AI-powered human-in-the-loop process to enable efficient data collection. A guided K-best selection process is proposed, which (i) generates a set of possible valid candidates; (ii) allows users to quickly traverse the set and filter incorrect parses; and (iii) asks users to select the correct parse, with minimal modification when necessary. We investigate how to best support users in efficiently traversing the candidate set and locating the correct parse, in terms of speed and accuracy. In our user study, consisting of five annotators labeling 300 instances each, we find that combining keyword searching, where keywords can be used to query relevant candidates, and keyword suggestion, where representative keywords are automatically generated, enables fast and accurate annotation.}, pdf = {belyy_2022_k_best/paper.pdf}, + doi = {10.18653/v1/2022.acl-demo.11}, } @inproceedings{Stoica:2021:retacred, @@ -57,6 +61,7 @@ @inproceedings{Stoica:2021:retacred year = {2021}, abstract = {TACRED is one of the largest and most widely used sentence-level relation extraction datasets. Proposed models that are evaluated using this dataset consistently set new state-of-the-art performance. However, they still exhibit large error rates despite leveraging external knowledge and unsupervised pretraining on large text corpora. A recent study suggested that this may be due to poor dataset quality. The study observed that over 50% of the most challenging sentences from the development and test sets are incorrectly labeled and account for an average drop of 8% f1-score in model performance. However, this study was limited to a small biased sample of 5k (out of a total of 106k) sentences, substantially restricting the generalizability and broader implications of its findings. In this paper, we address these shortcomings by: (i) performing a comprehensive study over the whole TACRED dataset, (ii) proposing an improved crowdsourcing strategy and deploying it to re-annotate the whole dataset, and (iii) performing a thorough analysis to understand how correcting the TACRED annotations affects previously published results. After verification, we observed that 23.9% of TACRED labels are incorrect. Moreover, evaluating several models on our revised dataset yields an average f1-score improvement of 14.3% and helps uncover significant relationships between the different models (rather than simply offsetting or scaling their scores by a constant factor). 
Finally, aside from our analysis we also release Re-TACRED, a new completely re-annotated version of the TACRED dataset that can be used to perform reliable evaluation of relation extraction models.}, pdf = {stoica_2021_retacred/paper.pdf}, + doi = {10.1609/aaai.v35I15.17631}, } @inproceedings{Shin:2021:clamp, @@ -68,6 +73,7 @@ @inproceedings{Shin:2021:clamp year = {2021}, abstract = {We explore the use of large pretrained language models as few-shot semantic parsers. The goal in semantic parsing is to generate a structured meaning representation given a natural language input. However, language models are trained to generate natural language. To bridge the gap, we use language models to paraphrase inputs into a controlled sublanguage resembling English that can be automatically mapped to a target meaning representation. Our results demonstrate that with only a small amount of data and very little code to convert into English-like representations, our blueprint for rapidly bootstrapping semantic parsers leads to surprisingly effective performance on multiple community tasks, greatly exceeding baseline methods also trained on the same limited data.}, pdf = {shin_2021_clamp/paper.pdf}, + doi = {10.18653/v1/2021.emnlp-main.608}, } @inproceedings{Platanios:2021:platypus, @@ -80,6 +86,7 @@ @inproceedings{Platanios:2021:platypus abstract = {Conversational semantic parsers map user utterances to executable programs given dialogue histories composed of previous utterances, programs, and system responses. Existing parsers typically condition on rich representations of history that include the complete set of values and computations previously discussed. We propose a model that abstracts over values to focus prediction on type- and function-level context. This approach provides a compact encoding of dialogue histories and predicted programs, improving generalization and computational efficiency. Our model incorporates several other components, including an atomic span copy operation and structural enforcement of well-formedness constraints on predicted programs, that are particularly advantageous in the low-data regime. Trained on the SMCalFlow and TreeDST datasets, our model outperforms prior work by 7.3% and 10.6% respectively in terms of absolute accuracy. Trained on only a thousand examples from each dataset, it outperforms strong baselines by 12.4% and 6.4%. These results indicate that simple representations are key to effective generalization in conversational semantic parsing.}, pdf = {platanios_2021_platypus/paper.pdf}, slides = {../pptx/platanios_2021_platypus/slides.pptx}, + doi = {10.18653/v1/2021.acl-long.284}, } @inproceedings{Xian:2021:hyper_dynamics, @@ -102,7 +109,8 @@ @inproceedings{Yin:2021:compositional_generalization year = {2021}, abstract = {We describe a span-level supervised attention loss that improves compositional generalization in semantic parsers. Our approach builds on existing losses that encourage attention maps in neural sequence-to-sequence models to imitate the output of classical word alignment algorithms. Where past work has used word-level alignments, we focus on spans; borrowing ideas from phrase-based machine translation, we align subtrees in semantic parses to spans of input sentences, and encourage neural attention mechanisms to mimic these alignments. 
This method improves the performance of transformers, RNNs, and structured decoders on three benchmarks of compositional generalization.}, pdf = {yin_2021_compositional_generalization/paper.pdf}, - code = {https://github.com/microsoft/compositional-generalization-span-level-attention} + code = {https://github.com/microsoft/compositional-generalization-span-level-attention}, + doi = {10.18653/v1/2021.naacl-main.225}, } @thesis{Platanios:2020:thesis, @@ -113,7 +121,8 @@ @thesis{Platanios:2020:thesis year = {2020}, pdf = {thesis/thesis.pdf}, slides = {thesis/defense.pdf}, - abstract = {Human intelligence is magnificent. One of its most impressive aspects is how humans always seem able to learn new skills quickly and without much supervision by utilizing previously learned skills and forming connections between them. More specifically, human learning is often not about learning a single skill in isolation, but rather about learning collections of skills and utilizing relationships between them to learn more efficiently. Furthermore, these relationships may either be explicitly provided or implicitly learned, indicating high levels of abstraction in the learned abilities. On the other hand, even though machine learning has witnessed growing success across a multitude of applications over the past years, current systems are each highly specialized to solve one or just a handful of problems. In this thesis, we argue that a computer system that learns to perform multiple tasks jointly and that is aware of the relationships between these tasks, will be able to learn more efficiently and effectively than a system that learns to perform each task in isolation. Moreover, the relationships between the tasks may either be explicitly provided through supervision or implicitly learned by the system itself, and will allow the system to self-reflect and evaluate itself without any task-specific supervision. This includes learning relationships in the form of higher-order functions—namely functions that compose, transform, or otherwise manipulate other functions—that can enable truly multi-task and zero-shot learning. In the first part, we present a method that allows learning systems to evaluate themselves in an unsupervised manner by leveraging explicitly provided relationships between multiple learned functions. We refer to this ability as self-reflection and show how it addresses an important limitation of existing never-ending learning systems like the never-ending language learner (Mitchell et al., 2018). We then propose multiple extensions that improve upon this method, resulting in several robust algorithms for estimating the accuracy of classifiers from unlabeled data. In the second part, we consider more general multi-task learning settings and propose an abstract framework called contextual parameter generation (CPG), which allows systems to generate functions for solving different kinds of tasks without necessarily having been shown any training data for these tasks. This framework generalizes existing approaches in multi-task learning, transfer learning, and meta-learning, and it further allows for learning arbitrary higher-order functions. It does so by formalizing the notion of a function representation and what it means for functions to operate on other functions or even on themselves. 
This new type of learning, which we refer to as higher-order learning, enables learning relationships between multiple functions in the form of higher-order functions, and is inspired by functional programming and category theory. Finally, we propose the jelly bean world (JBW), a novel evaluation framework for never-ending learning systems.} + abstract = {Human intelligence is magnificent. One of its most impressive aspects is how humans always seem able to learn new skills quickly and without much supervision by utilizing previously learned skills and forming connections between them. More specifically, human learning is often not about learning a single skill in isolation, but rather about learning collections of skills and utilizing relationships between them to learn more efficiently. Furthermore, these relationships may either be explicitly provided or implicitly learned, indicating high levels of abstraction in the learned abilities. On the other hand, even though machine learning has witnessed growing success across a multitude of applications over the past years, current systems are each highly specialized to solve one or just a handful of problems. In this thesis, we argue that a computer system that learns to perform multiple tasks jointly and that is aware of the relationships between these tasks, will be able to learn more efficiently and effectively than a system that learns to perform each task in isolation. Moreover, the relationships between the tasks may either be explicitly provided through supervision or implicitly learned by the system itself, and will allow the system to self-reflect and evaluate itself without any task-specific supervision. This includes learning relationships in the form of higher-order functions—namely functions that compose, transform, or otherwise manipulate other functions—that can enable truly multi-task and zero-shot learning. In the first part, we present a method that allows learning systems to evaluate themselves in an unsupervised manner by leveraging explicitly provided relationships between multiple learned functions. We refer to this ability as self-reflection and show how it addresses an important limitation of existing never-ending learning systems like the never-ending language learner (Mitchell et al., 2018). We then propose multiple extensions that improve upon this method, resulting in several robust algorithms for estimating the accuracy of classifiers from unlabeled data. In the second part, we consider more general multi-task learning settings and propose an abstract framework called contextual parameter generation (CPG), which allows systems to generate functions for solving different kinds of tasks without necessarily having been shown any training data for these tasks. This framework generalizes existing approaches in multi-task learning, transfer learning, and meta-learning, and it further allows for learning arbitrary higher-order functions. It does so by formalizing the notion of a function representation and what it means for functions to operate on other functions or even on themselves. This new type of learning, which we refer to as higher-order learning, enables learning relationships between multiple functions in the form of higher-order functions, and is inspired by functional programming and category theory. 
Finally, we propose the jelly bean world (JBW), a novel evaluation framework for never-ending learning systems.}, + doi = {10.1184/R1/13574678.V1}, } @inproceedings{Platanios:2020:jbw, @@ -125,7 +134,8 @@ @inproceedings{Platanios:2020:jbw year = {2020}, abstract = {Machine learning has shown growing success in recent years. However, current machine learning systems are highly specialized, trained for particular problems or domains, and typically on a single narrow dataset. Human learning, on the other hand, is highly general and adaptable. Never-ending learning is a machine learning paradigm that aims to bridge this gap, with the goal of encouraging researchers to design machine learning systems that can learn to perform a wider variety of inter-related tasks in more complex environments. To date, there is no environment or testbed to facilitate the development and evaluation of never-ending learning systems. To this end, we propose the Jelly Bean World testbed. The Jelly Bean World allows experimentation over two-dimensional grid worlds which are filled with items and in which agents can navigate. This testbed provides environments that are sufficiently complex and where more generally intelligent algorithms ought to perform better than current state-of-the-art reinforcement learning approaches. It does so by producing non-stationary environments and facilitating experimentation with multi-task, multi-agent, multi-modal, and curriculum learning settings. We hope that this new freely-available software will prompt new research and interest in the development and evaluation of never-ending learning systems and more broadly, general intelligence systems.}, pdf = {platanios-2020-jbw-paper.pdf}, - code = {https://github.com/eaplatanios/jelly-bean-world} + code = {https://github.com/eaplatanios/jelly-bean-world}, + doi = {10.48550/arXiv.2002.06306}, } @inproceedings{Platanios:2020:coper, @@ -136,7 +146,8 @@ @inproceedings{Platanios:2020:coper year = {2020}, abstract = {We consider the task of knowledge graph link prediction. Given a question consisting of a source entity and a relation (e.g., Shakespeare and BornIn), the objective is to predict the most likely answer entity (e.g., England). Recent approaches tackle this problem by learning entity and relation embeddings. However, they often constrain the relationship between these embeddings to be additive (i.e., the embeddings are concatenated and then processed by a sequence of linear functions and element-wise non-linearities). We show that this type of interaction significantly limits representational power. For example, such models cannot handle cases where a different projection of the source entity is used for each relation. We propose to use contextual parameter generation to address this limitation. More specifically, we treat relations as the context in which source entities are processed to produce predictions, by using relation embeddings to generate the parameters of a model operating over source entity embeddings. This allows models to represent more complex interactions between entities and relations. We apply our method on two existing link prediction methods, including the current state-of-the-art, resulting in significant performance gains and establishing a new state-of-the-art for this task. 
These gains are achieved while also reducing training time by up to 28 times.}, pdf = {platanios_2020_coper/paper.pdf}, - code = {https://github.com/otiliastr/coper} + code = {https://github.com/otiliastr/coper}, + doi = {10.1609/aaai.v34i03.5693}, } @inproceedings{Stretcu:2019, @@ -164,7 +175,8 @@ @inproceedings{Platanios:2019 pdf = {platanios_2019_curriculum_nmt/paper.pdf}, poster = {platanios_2019_curriculum_nmt/poster.pdf}, slides = {platanios_2019_curriculum_nmt/slides.pdf}, - code = {https://github.com/eaplatanios/symphony-mt} + code = {https://github.com/eaplatanios/symphony-mt}, + doi = {10.18653/v1/N19-1119}, } @inproceedings{Platanios:2018, @@ -180,7 +192,8 @@ @inproceedings{Platanios:2018 pdf = {platanios_2018_cpg_nmt/paper.pdf}, poster = {platanios_2018_cpg_nmt/poster.pdf}, slides = {platanios_2018_cpg_nmt/slides.pdf}, - code = {https://github.com/eaplatanios/symphony-mt} + code = {https://github.com/eaplatanios/symphony-mt}, + doi = {10.18653/v1/D18-1039}, } @article{Mitchell:2018:cacm, @@ -197,12 +210,12 @@ @article{Mitchell:2018:cacm pages = {103--115}, numpages = {13}, url = {http://doi.acm.org/10.1145/3191513}, - doi = {10.1145/3191513}, acmid = {3191513}, publisher = {ACM}, address = {New York, NY, USA}, pdf = {mitchell_2018_cacm/paper.pdf}, - abstract = {Whereas people learn many different types of knowledge from diverse experiences over many years, and become better learners over time, most current machine learning systems are much more narrow, learning just a single function or data model based on statistical analysis of a single data set. We suggest that people learn better than computers precisely because of this difference, and we suggest a key direction for machine learning research is to develop software architectures that enable intelligent agents to also learn many types of knowledge, continuously over many years, and to become better learners over time. In this paper we define more precisely this never-ending learning paradigm for machine learning, and we present one case study: the Never-Ending Language Learner (NELL), which achieves a number of the desired properties of a never-ending learner. NELL has been learning to read the Web 24hrs/day since January 2010, and so far has acquired a knowledge base with 120mn diverse, confidence-weighted beliefs (e.g., servedWith(tea,biscuits)), while learning thousands of interrelated functions that continually improve its reading competence over time. NELL has also learned to reason over its knowledge base to infer new beliefs it has not yet read from those it has, and NELL is inventing new relational predicates to extend the ontology it uses to represent beliefs. We describe the design of NELL, experimental results illustrating its behavior, and discuss both its successes and shortcomings as a case study in never-ending learning. NELL can be tracked online at http://rtw.ml.cmu.edu, and followed on Twitter at @CMUNELL.} + abstract = {Whereas people learn many different types of knowledge from diverse experiences over many years, and become better learners over time, most current machine learning systems are much more narrow, learning just a single function or data model based on statistical analysis of a single data set. 
We suggest that people learn better than computers precisely because of this difference, and we suggest a key direction for machine learning research is to develop software architectures that enable intelligent agents to also learn many types of knowledge, continuously over many years, and to become better learners over time. In this paper we define more precisely this never-ending learning paradigm for machine learning, and we present one case study: the Never-Ending Language Learner (NELL), which achieves a number of the desired properties of a never-ending learner. NELL has been learning to read the Web 24hrs/day since January 2010, and so far has acquired a knowledge base with 120mn diverse, confidence-weighted beliefs (e.g., servedWith(tea,biscuits)), while learning thousands of interrelated functions that continually improve its reading competence over time. NELL has also learned to reason over its knowledge base to infer new beliefs it has not yet read from those it has, and NELL is inventing new relational predicates to extend the ontology it uses to represent beliefs. We describe the design of NELL, experimental results illustrating its behavior, and discuss both its successes and shortcomings as a case study in never-ending learning. NELL can be tracked online at http://rtw.ml.cmu.edu, and followed on Twitter at @CMUNELL.}, + doi = {10.1145/3191513}, } @eprint{Platanios:2018:agreement_based_learning, @@ -215,7 +228,8 @@ @eprint{Platanios:2018:agreement_based_learning abbr = {arXiv}, year = {2018}, pdf = {platanios_2018_agreement_based_learning/paper.pdf}, - abstract = {{Model selection is a problem that has occupied machine learning researchers for a long time. Recently, its importance has become evident through applications in deep learning. We propose an agreement-based learning framework that prevents many of the pitfalls associated with model selection. It relies on coupling the training of multiple models by encouraging them to agree on their predictions while training. In contrast with other model selection and combination approaches used in machine learning, the proposed framework is inspired by human learning. We also propose a learning algorithm defined within this framework which manages to significantly outperform alternatives in practice, and whose performance improves further with the availability of unlabeled data. Finally, we describe a number of potential directions for developing more flexible agreement-based learning algorithms.}} + abstract = {{Model selection is a problem that has occupied machine learning researchers for a long time. Recently, its importance has become evident through applications in deep learning. We propose an agreement-based learning framework that prevents many of the pitfalls associated with model selection. It relies on coupling the training of multiple models by encouraging them to agree on their predictions while training. In contrast with other model selection and combination approaches used in machine learning, the proposed framework is inspired by human learning. We also propose a learning algorithm defined within this framework which manages to significantly outperform alternatives in practice, and whose performance improves further with the availability of unlabeled data. 
Finally, we describe a number of potential directions for developing more flexible agreement-based learning algorithms.}}, + doi = {10.48550/arXiv.1806.01258}, } @eprint{Platanios:2018:deep_graphs, @@ -228,7 +242,8 @@ @eprint{Platanios:2018:deep_graphs abbr = {arXiv}, year = {2018}, pdf = {platanios_2018_deep_graphs/paper.pdf}, - abstract = {{We propose an algorithm for deep learning on networks and graphs. It relies on the notion that many graph algorithms, such as PageRank, Weisfeiler-Lehman, or Message Passing can be expressed as iterative vertex updates. Unlike previous methods which rely on the ingenuity of the designer, Deep Graphs are adaptive to the estimation problem. Training and deployment are both efficient, since the cost is O(|E|+|V|), where E and V are the sets of edges and vertices respectively. In short, we learn the recurrent update functions rather than positing their specific functional form. This yields an algorithm that achieves excellent accuracy on both graph labeling and regression tasks.}} + abstract = {{We propose an algorithm for deep learning on networks and graphs. It relies on the notion that many graph algorithms, such as PageRank, Weisfeiler-Lehman, or Message Passing can be expressed as iterative vertex updates. Unlike previous methods which rely on the ingenuity of the designer, Deep Graphs are adaptive to the estimation problem. Training and deployment are both efficient, since the cost is O(|E|+|V|), where E and V are the sets of edges and vertices respectively. In short, we learn the recurrent update functions rather than positing their specific functional form. This yields an algorithm that achieves excellent accuracy on both graph labeling and regression tasks.}}, + doi = {10.48550/arXiv.1806.01235}, } @eprint{Platanios:2017:active_learning, @@ -241,7 +256,8 @@ @eprint{Platanios:2017:active_learning abbr = {arXiv}, year = {2017}, pdf = {platanios_2017_active_learning/paper.pdf}, - abstract = {{Structured prediction is ubiquitous in applications of machine learning such as knowledge extraction and natural language processing. Structure often can be formulated in terms of logical constraints. We consider the question of how to perform efficient active learning in the presence of logical constraints among variables inferred by different classifiers. We propose several methods and provide theoretical results that demonstrate the inappropriateness of employing uncertainty guided sampling, a commonly used active learning method. Furthermore, experiments on ten different datasets demonstrate that the methods significantly outperform alternatives in practice. The results are of practical significance in situations where labeled data is scarce.}} + abstract = {{Structured prediction is ubiquitous in applications of machine learning such as knowledge extraction and natural language processing. Structure often can be formulated in terms of logical constraints. We consider the question of how to perform efficient active learning in the presence of logical constraints among variables inferred by different classifiers. We propose several methods and provide theoretical results that demonstrate the inappropriateness of employing uncertainty guided sampling, a commonly used active learning method. Furthermore, experiments on ten different datasets demonstrate that the methods significantly outperform alternatives in practice. 
The results are of practical significance in situations where labeled data is scarce.}}, + doi = {10.48550/arXiv.1709.08850}, } @inproceedings{Platanios:2017:accuracy_estimation_logic, @@ -254,7 +270,8 @@ @inproceedings{Platanios:2017:accuracy_estimation_logic pdf = {platanios_2017_logic/paper.pdf}, supp = {platanios_2017_logic/supplementary.pdf}, poster = {platanios_2017_logic/poster.pdf}, - abstract = {{We propose an efficient method to estimate the accuracy of classifiers using only unlabeled data. We consider a setting with multiple classification problems where the target classes may be tied together through logical constraints. For example, a set of classes may be mutually exclusive, meaning that a data instance can belong to at most one of them. The proposed method is based on the intuition that: (i) when classifiers agree, they are more likely to be correct, and (ii) when the classifiers make a prediction that violates the constraints, at least one classifier must be making an error. Experiments on four real-world data sets produce accuracy estimates within a few percent of the true accuracy, using solely unlabeled data. Our models also outperform existing state-of-the-art solutions in both estimating accuracies, and combining multiple classifier outputs. The results emphasize the utility of logical constraints in estimating accuracy, thus validating our intuition.}} + abstract = {{We propose an efficient method to estimate the accuracy of classifiers using only unlabeled data. We consider a setting with multiple classification problems where the target classes may be tied together through logical constraints. For example, a set of classes may be mutually exclusive, meaning that a data instance can belong to at most one of them. The proposed method is based on the intuition that: (i) when classifiers agree, they are more likely to be correct, and (ii) when the classifiers make a prediction that violates the constraints, at least one classifier must be making an error. Experiments on four real-world data sets produce accuracy estimates within a few percent of the true accuracy, using solely unlabeled data. Our models also outperform existing state-of-the-art solutions in both estimating accuracies, and combining multiple classifier outputs. The results emphasize the utility of logical constraints in estimating accuracy, thus validating our intuition.}}, + doi = {10.48550/arXiv.1705.07086}, } @inproceedings{Platanios:2016ti, @@ -279,7 +296,8 @@ @inproceedings{Mitchell:2015wo year = {2015}, pages = {1--9}, pdf = {mitchell_2015wo/mitchell_2015wo.pdf}, - abstract = {Whereas people learn many different types of knowledge from diverse experiences over many years, most current machine learning systems acquire just a single function or data model from just a single data set. We propose a neverending learning paradigm for machine learning, to better reflect the more ambitious and encompassing type of learning performed by humans. As a case study, we describe the Never-Ending Language Learner (NELL), which achieves some of the desired properties of a never-ending learner, and we discuss lessons learned. NELL has been learning to read the web 24 hours/day since January 2010, and so far has acquired a knowledge base with over 80 million confidenceweighted beliefs (e.g., servedWith(tea, biscuits)). NELL has also learned millions of features and parameters that enable it to read these beliefs from the web. 
Additionally, it has learned to reason over these beliefs to infer new beliefs, and is able to extend its ontology by synthesizing new relational predicates. NELL can be tracked online at http://rtw.ml.cmu.edu, and followed on Twitter at @CMUNELL.} + abstract = {Whereas people learn many different types of knowledge from diverse experiences over many years, most current machine learning systems acquire just a single function or data model from just a single data set. We propose a neverending learning paradigm for machine learning, to better reflect the more ambitious and encompassing type of learning performed by humans. As a case study, we describe the Never-Ending Language Learner (NELL), which achieves some of the desired properties of a never-ending learner, and we discuss lessons learned. NELL has been learning to read the web 24 hours/day since January 2010, and so far has acquired a knowledge base with over 80 million confidenceweighted beliefs (e.g., servedWith(tea, biscuits)). NELL has also learned millions of features and parameters that enable it to read these beliefs from the web. Additionally, it has learned to reason over these beliefs to infer new beliefs, and is able to extend its ontology by synthesizing new relational predicates. NELL can be tracked online at http://rtw.ml.cmu.edu, and followed on Twitter at @CMUNELL.}, + doi = {10.1609/aaai.v29i1.9498}, } @thesis{Platanios:2015ui, @@ -304,7 +322,8 @@ @inproceedings{Platanios:2014ti pdf = {platanios_2014ti/platanios_2014ti.pdf}, poster = {platanios_2014ti/platanios_2014ti_poster.pdf}, addendum = {platanios_2014ti/platanios_2014ti_addendum.pdf}, - abstract = {We consider the question of how unlabeled data can be used to estimate the true accuracy of learned classifiers. This is an important question for any autonomous learning system that must estimate its accuracy without supervision, and also when classifiers trained from one data distribution must be applied to a new distribution (e.g., document classifiers trained on one text corpus are to be applied to a second corpus). We first show how to estimate error rates exactly from unlabeled data when given a collection of competing classifiers that make independent errors, based on the agreement rates between subsets of these classifiers. We further show that even when the competing classifiers do not make independent errors, both their accuracies and error dependencies can be estimated by making certain relaxed assumptions. Experiments on two data real-world data sets produce estimates within a few percent of the true accuracy, using solely unlabeled data. These results are of practical significance in situations where labeled data is scarce and shed light on the more general question of how the consistency among multiple functions is related to their true accuracies.} + abstract = {We consider the question of how unlabeled data can be used to estimate the true accuracy of learned classifiers. This is an important question for any autonomous learning system that must estimate its accuracy without supervision, and also when classifiers trained from one data distribution must be applied to a new distribution (e.g., document classifiers trained on one text corpus are to be applied to a second corpus). We first show how to estimate error rates exactly from unlabeled data when given a collection of competing classifiers that make independent errors, based on the agreement rates between subsets of these classifiers. 
We further show that even when the competing classifiers do not make independent errors, both their accuracies and error dependencies can be estimated by making certain relaxed assumptions. Experiments on two real-world data sets produce estimates within a few percent of the true accuracy, using solely unlabeled data. These results are of practical significance in situations where labeled data is scarce and shed light on the more general question of how the consistency among multiple functions is related to their true accuracies.}, + doi = {10.5555/3020751.3020822}, } @article{Platanios:2014gp, @@ -318,7 +337,8 @@ @article{Platanios:2014gp pages = {888--900}, month = may, pdf = {platanios_2014gp/platanios_2014gp.pdf}, - abstract = {Generalized autoregressive conditional heteroscedasticity (GARCH) models have long been considered as one of the most successful families of approaches for volatility modeling in financial return series. In this paper, we propose an alternative approach based on methodologies widely used in the field of statistical machine learning. Specifically, we propose a novel nonparametric Bayesian mixture of Gaussian process regression models, each component of which models the noise variance process that contaminates the observed data as a separate latent Gaussian process driven by the observed data. This way, we essentially obtain a Gaussian process-mixture conditional heteroscedasticity (GPMCH) model for volatility modeling in financial return series. We impose a nonparametric prior with power-law nature over the distribution of the model mixture components, namely the Pitman-Yor process prior, to allow for better capturing modeled data distributions with heavy tails and skewness. Finally, we provide a copula-based approach for obtaining a predictive posterior for the covariances over the asset returns modeled by means of a postulated GPMCH model.
We evaluate the efficacy of our approach in a number of benchmark scenarios, and compare its performance to state-of-the-art methodologies.}, + doi = {10.1109/TPAMI.2013.183}, } @inproceedings{Platanios:2012uh, diff --git a/_layouts/default.html b/_layouts/default.html index 3f797ed6b50b..1b5257fd5fc7 100644 --- a/_layouts/default.html +++ b/_layouts/default.html @@ -15,6 +15,9 @@ + + + diff --git a/_layouts/publication.html b/_layouts/publication.html index 1e85c1afa9b6..c77bed4f9b8e 100644 --- a/_layouts/publication.html +++ b/_layouts/publication.html @@ -110,6 +110,16 @@
{{entry.title}}.
{% if entry.arxiv %} arXiv {% endif %} + {% if entry.abstract %}
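Note on the _layouts/publication.html hunk above: per the commit subject, this change appears to add DOI rendering next to the existing entry.arxiv and entry.abstract checks. The snippet below is only an illustrative sketch of how such a DOI link is commonly rendered in a jekyll-scholar publication layout; it is not the verbatim markup of this commit, and it assumes the layout exposes the new BibTeX field as entry.doi, mirroring how entry.arxiv and entry.abstract are already accessed.

    {% if entry.doi %}
      <!-- Illustrative sketch only: resolve the DOI through the standard doi.org resolver. -->
      <a href="https://doi.org/{{ entry.doi }}" target="_blank" rel="noopener">DOI</a>
    {% endif %}

Guarding on entry.doi keeps the layout working for older entries in papers.bib that do not yet carry a doi field, since the block simply renders nothing when the field is absent.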