People

Pablo Sánchez
E: sanchez@cs.uni-saarland.de
About me
I started my PhD in September 2019, supervised by Prof. Valera & Prof. Sonja Utz (from Leibniz-Institut für Wissensmedien). I am also part of the International Max Planck Research School for Intelligent Systems (IMPRS-IS) PhD program.
Broadly speaking, my research is focused on building machine learning methods for the analysis of real world data. I am specially focused on (social) network data, such as Twitter. Apart from handling real world data, I also want these model to give predictions that i) people can understand and ii) are are able to work under unexpected settings. Thus, interpretability and robustness are two research topics I am very interested about.
Publications
2024
Sánchez-Martin, Pablo; Utz, Sonja; Valera, Isabel
Exploring the Boundaries of Ambient Awareness in Twitter Journal Article
In: CoRR, vol. abs/2403.17776, 2024.
@article{DBLP:journals/corr/abs-2403-17776,
title = {Exploring the Boundaries of Ambient Awareness in Twitter},
author = {Pablo Sánchez-Martin and Sonja Utz and Isabel Valera},
url = {https://doi.org/10.48550/arXiv.2403.17776},
doi = {10.48550/ARXIV.2403.17776},
year = {2024},
date = {2024-01-01},
urldate = {2024-01-01},
journal = {CoRR},
volume = {abs/2403.17776},
abstract = {Ambient awareness refers to the ability of social media users to obtain knowledge about who knows what (i.e., users' expertise) in their network, by simply being exposed to other users' content (e.g, tweets on Twitter). Previous work, based on user surveys, reveals that individuals self-report ambient awareness only for parts of their networks. However, it is unclear whether it is their limited cognitive capacity or the limited exposure to diagnostic tweets (i.e., online content) that prevents people from developing ambient awareness for their complete network. In this work, we focus on in-wall ambient awareness (IWAA) in Twitter and conduct a two-step data-driven analysis, that allows us to explore to which extent IWAA is likely, or even possible. First, we rely on reactions (e.g., likes), as strong evidence of users being aware of experts in Twitter. Unfortunately, such strong evidence can be only measured for active users, which represent the minority in the network. Thus to study the boundaries of IWAA to a larger extent, in the second part of our analysis, we instead focus on the passive exposure to content generated by other users -- which we refer to as in-wall visibility. This analysis shows that (in line with citet{levordashka2016ambient}) only for a subset of users IWAA is plausible, while for the majority it is unlikely, if even possible, to develop IWAA. We hope that our methodology paves the way for the emergence of data-driven approaches for the study of ambient awareness.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Sánchez-Martin, Pablo; Khan, Kinaan Aamir; Valera, Isabel
Improving the interpretability of GNN predictions through conformal-based graph sparsification Journal Article
In: CoRR, vol. abs/2404.12356, 2024.
@article{DBLP:journals/corr/abs-2404-12356,
title = {Improving the interpretability of GNN predictions through conformal-based graph sparsification},
author = {Pablo Sánchez-Martin and Kinaan Aamir Khan and Isabel Valera},
url = {https://doi.org/10.48550/arXiv.2404.12356},
doi = {10.48550/ARXIV.2404.12356},
year = {2024},
date = {2024-01-01},
urldate = {2024-01-01},
journal = {CoRR},
volume = {abs/2404.12356},
abstract = {Graph Neural Networks (GNNs) have achieved state-of-the-art performance in solving graph classification tasks. However, most GNN architectures aggregate information from all nodes and edges in a graph, regardless of their relevance to the task at hand, thus hindering the interpretability of their predictions. In contrast to prior work, in this paper we propose a GNN emph{training} approach that jointly i) finds the most predictive subgraph by removing edges and/or nodes -- -emph{without making assumptions about the subgraph structure} -- while ii) optimizing the performance of the graph classification task. To that end, we rely on reinforcement learning to solve the resulting bi-level optimization with a reward function based on conformal predictions to account for the current in-training uncertainty of the classifier. Our empirical results on nine different graph classification datasets show that our method competes in performance with baselines while relying on significantly sparser subgraphs, leading to more interpretable GNN-based predictions.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
2023
Javaloy, Adrián; Sánchez-Mart'ın, Pablo; Valera, Isabel
Causal normalizing flows: from theory to practice Journal Article
In: CoRR, vol. abs/2306.05415, 2023.
@article{DBLP:journals/corr/abs-2306-05415,
title = {Causal normalizing flows: from theory to practice},
author = {Adrián Javaloy and Pablo Sánchez-Mart'ın and Isabel Valera},
url = {https://doi.org/10.48550/arXiv.2306.05415},
doi = {10.48550/arXiv.2306.05415},
year = {2023},
date = {2023-01-01},
urldate = {2023-01-01},
journal = {CoRR},
volume = {abs/2306.05415},
abstract = {In this work, we deepen on the use of normalizing flows for causal reasoning. Specifically, we first leverage recent results on non-linear ICA to show that causal models are identifiable from observational data given a causal ordering, and thus can be recovered using autoregressive normalizing flows (NFs). Second, we analyze different design and learning choices for causal normalizing flows to capture the underlying causal data-generating process. Third, we describe how to implement the do-operator in causal NFs, and thus, how to answer interventional and counterfactual questions. Finally, in our experiments, we validate our design and training choices through a comprehensive ablation study; compare causal NFs to other approaches for approximating causal models; and empirically demonstrate that causal NFs can be used to address real-world problems—where the presence of mixed discrete-continuous data and partial knowledge on the causal graph is the norm. The code for this work can be found at https://github.com/psanch21/causal-flows.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Sánchez-Mart'ın, Pablo; Olmos, Pablo M.; Pérez-Cruz, Fernando
Enhancing diversity in GANs via non-uniform sampling Journal Article
In: Inf. Sci., vol. 637, pp. 118928, 2023.
@article{DBLP:journals/isci/SanchezMartinOP23,
title = {Enhancing diversity in GANs via non-uniform sampling},
author = {Pablo Sánchez-Mart'ın and Pablo M. Olmos and Fernando Pérez-Cruz},
url = {https://doi.org/10.1016/j.ins.2023.04.007},
doi = {10.1016/j.ins.2023.04.007},
year = {2023},
date = {2023-01-01},
urldate = {2023-01-01},
journal = {Inf. Sci.},
volume = {637},
pages = {118928},
abstract = {Recent advances in Generative Adversarial Networks (GANs) have led to impressive results in generating realistic data. However, GANs training is still challenging, often leading to mode-collapse, where a certain type of samples dominates the generated output. To address this issue, we propose a novel training algorithm based on bidirectional GANs (BiGANs) that can be generalized to any implicit generative model. Our algorithm relies on a non-uniform sampling scheme, where data points in a minibatch are sampled with probability inversely proportional to their log-evidence. However, estimating log-evidence is computationally expensive. Instead, we propose to use the reconstruction error, which directly correlates with the log-evidence and only requires a BiGAN network evaluation. Additionally, we combine the aforementioned method with a regularization in the empirical distribution of the encoder that further boosts the performance. Our empirical results show that the proposed methods improve both the quality and diversity of the generated samples.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Javaloy, Adrián; Sánchez-Mart'ın, Pablo; Levi, Amit; Valera, Isabel
Learnable Graph Convolutional Attention Networks Proceedings Article
In: The Eleventh International Conference on Learning Representations, ICLR 2023, Kigali, Rwanda, May 1-5, 2023, OpenReview.net, 2023.
@inproceedings{DBLP:conf/iclr/JavaloySLV23,
title = {Learnable Graph Convolutional Attention Networks},
author = {Adrián Javaloy and Pablo Sánchez-Mart'ın and Amit Levi and Isabel Valera},
url = {https://openreview.net/pdf?id=WsUMeHPo-2},
year = {2023},
date = {2023-01-01},
urldate = {2023-01-01},
booktitle = {The Eleventh International Conference on Learning Representations,
ICLR 2023, Kigali, Rwanda, May 1-5, 2023},
publisher = {OpenReview.net},
abstract = {Existing Graph Neural Networks (GNNs) compute the message exchange between nodes by either aggregating uniformly (convolving) the features of all the neighbor- ing nodes, or by applying a non-uniform score (attending) to the features. Recent works have shown the strengths and weaknesses of the resulting GNN architectures, respectively, GCNs and GATs. In this work, we aim at exploiting the strengths of both approaches to their full extent. To this end, we first introduce the graph convolutional attention layer (CAT), which relies on convolutions to compute the attention scores. Unfortunately, as in the case of GCNs and GATs, we show that there exists no clear winner between the three—neither theoretically nor in practice—as their performance directly depends on the nature of the data (i.e., of the graph and features). This result brings us to the main contribution of our work, the learnable graph convolutional attention network (L-CAT): a GNN architecture that automatically interpolates between GCN, GAT and CAT in each layer, by adding only two scalar parameters. Our results demonstrate that L-CAT is able to efficiently combine different GNN layers along the network, outperforming competing methods in a wide range of datasets, and resulting in a more robust model that reduces the need of cross-validating.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
Reyes-Sanchez, Manuel; Amaducci, Rodrigo; Sánchez-Mart'ın, Pablo; Elices, Irene; Rodr'ıguez, Francisco Borja; Varona, Pablo
Automatized offline and online exploration to achieve a target dynamics in biohybrid neural circuits built with living and model neurons Journal Article
In: Neural Networks, vol. 164, pp. 464–475, 2023.
@article{DBLP:journals/nn/ReyesSanchezASERV23,
title = {Automatized offline and online exploration to achieve a target dynamics in biohybrid neural circuits built with living and model neurons},
author = {Manuel Reyes-Sanchez and Rodrigo Amaducci and Pablo Sánchez-Mart'ın and Irene Elices and Francisco Borja Rodr'ıguez and Pablo Varona},
url = {https://doi.org/10.1016/j.neunet.2023.04.034},
doi = {10.1016/J.NEUNET.2023.04.034},
year = {2023},
date = {2023-01-01},
urldate = {2023-01-01},
journal = {Neural Networks},
volume = {164},
pages = {464–475},
abstract = {Biohybrid circuits of interacting living and model neurons are an advantageous means to study neural dynamics and to assess the role of specific neuron and network properties in the nervous system. Hybrid networks are also a necessary step to build effective artificial intelligence and brain hybridization. In this work, we deal with the automatized online and offline adaptation, exploration and parameter mapping to achieve a target dynamics in hybrid circuits and, in particular, those that yield dynamical invariants between living and model neurons. We address dynamical invariants that form robust cycle-by-cycle relationships between the intervals that build neural sequences from such interaction. Our methodology first attains automated adaptation of model neurons to work in the same amplitude regime and time scale of living neurons. Then, we address the automatized exploration and mapping of the synapse parameter space that lead to a specific dynamical invariant target. Our approach uses multiple configurations and parallel computing from electrophysiological recordings of living neurons to build full mappings, and genetic algorithms to achieve an instance of the target dynamics for the hybrid circuit in a short time. We illustrate and validate such strategy in the context of the study of functional sequences in neural rhythms, which can be easily generalized for any variety of hybrid circuit configuration. This approach facilitates both the building of hybrid circuits and the accomplishment of their scientific goal.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Koyuncu, Batuhan; Sánchez-Mart'ın, Pablo; Peis, Ignacio; Olmos, Pablo M.; Valera, Isabel
Variational Mixture of HyperGenerators for Learning Distributions Over Functions Journal Article
In: CoRR, vol. abs/2302.06223, 2023.
@article{DBLP:journals/corr/abs-2302-06223,
title = {Variational Mixture of HyperGenerators for Learning Distributions Over Functions},
author = {Batuhan Koyuncu and Pablo Sánchez-Mart'ın and Ignacio Peis and Pablo M. Olmos and Isabel Valera},
url = {https://doi.org/10.48550/arXiv.2302.06223},
doi = {10.48550/arXiv.2302.06223},
year = {2023},
date = {2023-01-01},
urldate = {2023-01-01},
journal = {CoRR},
volume = {abs/2302.06223},
abstract = {Recent approaches build on implicit neural representations (INRs) to propose generative models over function spaces. However, they are computationally costly when dealing with inference tasks, such as missing data imputation, or directly cannot tackle them. In this work, we propose a novel deep generative model, named VAMoH. VAMoH combines the capabilities of modeling continuous functions using INRs and the inference capabilities of Variational Autoencoders (VAEs). In addition, VAMoH relies on a normalizing flow to define the prior, and a mixture of hypernetworks to parametrize the data log-likelihood. This gives VAMoH a high expressive capability and interpretability. Through experiments on a diverse range of data types, such as images, voxels, and climate data, we show that VAMoH can effectively learn rich distributions over continuous functions. Furthermore, it can perform inference-related tasks, such as conditional super-resolution generation and in-painting, as well or better than previous approaches, while being less computationally demanding.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
2022
Sánchez-Mart'ın, Pablo; Rateike, Miriam; Valera, Isabel
VACA: Designing Variational Graph Autoencoders for Causal Queries Proceedings Article
In: Thirty-Sixth AAAI Conference on Artificial Intelligence, AAAI 2022, Thirty-Fourth Conference on Innovative Applications of Artificial Intelligence, IAAI 2022, The Twelveth Symposium on Educational Advances in Artificial Intelligence, EAAI 2022 Virtual Event, February 22 - March 1, 2022, pp. 8159–8168, AAAI Press, 2022.
@inproceedings{DBLP:conf/aaai/Sanchez-MartinR22b,
title = {VACA: Designing Variational Graph Autoencoders for Causal Queries},
author = {Pablo Sánchez-Mart'ın and Miriam Rateike and Isabel Valera},
url = {https://ojs.aaai.org/index.php/AAAI/article/view/20789},
year = {2022},
date = {2022-01-01},
urldate = {2022-01-01},
booktitle = {Thirty-Sixth AAAI Conference on Artificial Intelligence, AAAI
2022, Thirty-Fourth Conference on Innovative Applications of Artificial
Intelligence, IAAI 2022, The Twelveth Symposium on Educational Advances
in Artificial Intelligence, EAAI 2022 Virtual Event, February 22
- March 1, 2022},
pages = {8159–8168},
publisher = {AAAI Press},
abstract = {In this paper, we introduce VACA, a novel class of variational graph autoencoders for causal inference in the absence of hidden confounders, when only observational data and the causal graph are available. Without making any parametric assumptions, VACA mimics the necessary properties of a Structural Causal Model (SCM) to provide a flexible and practical framework for approximating interventions (do-operator) and abduction-action-prediction steps. As a result, and as shown by our empirical results, VACA accurately approximates the interventional and counterfactual distributions on diverse SCMs. Finally, we apply VACA to evaluate counterfactual fairness in fair classification problems, as well as to learn fair classifiers without compromising performance.},
keywords = {},
pubstate = {published},
tppubtype = {inproceedings}
}
2019
Sánchez-Martín, Pablo; Olmos, Pablo M.; Pérez-Cruz, Fernando
Out-of-Sample Testing for GANs Journal Article
In: CoRR, vol. abs/1901.09557, 2019.
@article{DBLP:journals/corr/abs-1901-09557,
title = {Out-of-Sample Testing for GANs},
author = {Pablo Sánchez-Martín and Pablo M. Olmos and Fernando Pérez-Cruz},
url = {http://arxiv.org/abs/1901.09557},
year = {2019},
date = {2019-01-01},
urldate = {2019-01-01},
journal = {CoRR},
volume = {abs/1901.09557},
abstract = {We propose a new method to evaluate GANs, namely EvalGAN. EvalGAN relies on a test set to directly measure the reconstruction quality in the original sample space (no auxiliary networks are necessary), and it also computes the (log)likelihood for the reconstructed samples in the test set. Further, EvalGAN is agnostic to the GAN algorithm and the dataset. We decided to test it on three state-of-the-art GANs over the well-known CIFAR-10 and CelebA datasets.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
Sánchez-Martín, Pablo; Olmos, Pablo M.; Pérez-Cruz, Fernando
Improved BiGAN training with marginal likelihood equalization Journal Article
In: CoRR, vol. abs/1911.01425, 2019.
@article{DBLP:journals/corr/abs-1911-01425,
title = {Improved BiGAN training with marginal likelihood equalization},
author = {Pablo Sánchez-Martín and Pablo M. Olmos and Fernando Pérez-Cruz},
url = {http://arxiv.org/abs/1911.01425},
year = {2019},
date = {2019-01-01},
urldate = {2019-01-01},
journal = {CoRR},
volume = {abs/1911.01425},
abstract = {We propose a novel training procedure for improving the performance of generative adversarial networks (GANs), especially to bidirectional GANs. First, we enforce that the empirical distribution of the inverse inference network matches the prior distribution, which favors the generator network reproducibility on the seen samples. Second, we have found that the marginal log-likelihood of the samples shows a severe overrepresentation of a certain type of samples. To address this issue, we propose to train the bidirectional GAN using a non-uniform sampling for the mini-batch selection, resulting in improved quality and variety in generated samples measured quantitatively and by visual inspection. We illustrate our new procedure with the well-known CIFAR10, Fashion MNIST and CelebA datasets.},
keywords = {},
pubstate = {published},
tppubtype = {article}
}
