Update bibliography

coolneng 2022-10-20 14:23:02 +02:00
parent c1fe9158ce
commit 59529f5142
Signed by: coolneng
GPG Key ID: 9893DA236405AF57
2 changed files with 371 additions and 8 deletions

View File

@@ -5,8 +5,7 @@
#+OPTIONS: <:nil c:nil todo:nil H:5
#+auto_tangle: t
* Deep Learning
-** Transformers
-*** Attention is All You Need
+** Attention is All You Need
#+begin_src bibtex
@article{https://doi.org/10.48550/arxiv.1706.03762,
doi = {10.48550/ARXIV.1706.03762},
@@ -25,7 +24,7 @@
#+end_src
#+LaTeX: \printbibliography[heading=none]
-*** Axial Attention in Multidimensional Transformers
+** Axial Attention in Multidimensional Transformers
#+begin_src bibtex
@article{https://doi.org/10.48550/arxiv.1912.12180,
doi = {10.48550/ARXIV.1912.12180},
@@ -41,7 +40,7 @@
copyright = {arXiv.org perpetual, non-exclusive license}
}
#+end_src
-*** Longformer: The Long-Document Transformer
+** Longformer: The Long-Document Transformer
#+begin_src bibtex
@article{https://doi.org/10.48550/arxiv.2004.05150,
doi = {10.48550/ARXIV.2004.05150},
@@ -55,7 +54,7 @@
copyright = {arXiv.org perpetual, non-exclusive license}
}
#+end_src
-*** Transformer-XL: Attentive Language Models Beyond a Fixed-Length Context
+** Transformer-XL: Attentive Language Models Beyond a Fixed-Length Context
#+begin_src bibtex
@article{https://doi.org/10.48550/arxiv.1901.02860,
doi = {10.48550/ARXIV.1901.02860},
@@ -73,7 +72,7 @@
International}
}
#+end_src
-*** BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding
+** BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding
#+begin_src bibtex
@inproceedings{devlin-etal-2019-bert,
title = "{BERT}: Pre-training of Deep Bidirectional Transformers for
@@ -112,7 +111,7 @@
#+end_src
A masked language model (MLM) randomly masks some of the tokens from the input, and the objective is to predict the original input based only on its context.
-*** Fast Transformers with Clustered Attention
+** Fast Transformers with Clustered Attention
#+begin_src bibtex
@article{https://doi.org/10.48550/arxiv.2007.04825,
doi = {10.48550/ARXIV.2007.04825},
@@ -128,7 +127,7 @@ A masked language model (MLM) randomly masks some of the tokens from the input,
copyright = {arXiv.org perpetual, non-exclusive license}
}
#+end_src
-*** The elephant in the interpretability room: Why use attention as explanation when we have saliency methods?
+** The elephant in the interpretability room: Why use attention as explanation when we have saliency methods?
#+begin_src bibtex
@inproceedings{bastings-filippova-2020-elephant,
title = "The elephant in the interpretability room: Why use
@@ -160,7 +159,59 @@ A masked language model (MLM) randomly masks some of the tokens from the input,
state the goal and user for their explanations.",
}
#+end_src
** MultiMAE: Multi-modal Multi-task Masked Autoencoders
#+begin_src bibtex
@article{https://doi.org/10.48550/arxiv.2204.01678,
doi = {10.48550/ARXIV.2204.01678},
url = {https://arxiv.org/abs/2204.01678},
author = {Bachmann, Roman and Mizrahi, David and Atanov, Andrei and
Zamir, Amir},
keywords = {Computer Vision and Pattern Recognition (cs.CV), Machine
Learning (cs.LG), FOS: Computer and information sciences, FOS:
Computer and information sciences},
title = {MultiMAE: Multi-modal Multi-task Masked Autoencoders},
publisher = {arXiv},
year = 2022,
copyright = {arXiv.org perpetual, non-exclusive license}
}
#+end_src
* Deep Learning + Biology
** CpG Transformer for imputation of single-cell methylomes
#+begin_src bibtex
@article{10.1093/bioinformatics/btab746,
author = {De Waele, Gaetan and Clauwaert, Jim and Menschaert, Gerben
and Waegeman, Willem},
title = "{CpG Transformer for imputation of single-cell methylomes}",
journal = {Bioinformatics},
volume = 38,
number = 3,
pages = {597-603},
year = 2021,
month = 10,
abstract = "{The adoption of current single-cell DNA methylation
sequencing protocols is hindered by incomplete coverage,
outlining the need for effective imputation techniques. The
task of imputing single-cell (methylation) data requires
models to build an understanding of underlying biological
processes.We adapt the transformer neural network architecture
to operate on methylation matrices through combining axial
attention with sliding window self-attention. The obtained CpG
Transformer displays state-of-the-art performances on a wide
range of scBS-seq and scRRBS-seq datasets. Furthermore, we
demonstrate the interpretability of CpG Transformer and
illustrate its rapid transfer learning properties, allowing
practitioners to train models on new datasets with a limited
computational and time budget.CpG Transformer is freely
available at
https://github.com/gdewael/cpg-transformer.Supplementary data
are available at Bioinformatics online.}",
issn = {1367-4803},
doi = {10.1093/bioinformatics/btab746},
url = {https://doi.org/10.1093/bioinformatics/btab746},
eprint =
{https://academic.oup.com/bioinformatics/article-pdf/38/3/597/42167564/btab746.pdf},
}
#+end_src
** MSA Transformer
#+begin_src bibtex
@article {Rao2021.02.12.430858,
@@ -255,4 +306,140 @@ A masked language model (MLM) randomly masks some of the tokens from the input,
url = {https://doi.org/10.1038/s41586-021-03819-2}
}
#+end_src
** MultiVI: deep generative model for the integration of multi-modal data
#+begin_src bibtex
@article {Ashuach2021.08.20.457057,
author = {Ashuach, Tal and Gabitto, Mariano I. and Jordan, Michael I.
and Yosef, Nir},
title = {MultiVI: deep generative model for the integration of
multi-modal data},
elocation-id = {2021.08.20.457057},
year = 2021,
doi = {10.1101/2021.08.20.457057},
publisher = {Cold Spring Harbor Laboratory},
abstract = {Jointly profiling the transcriptional and chromatin
accessibility landscapes of single-cells is a powerful
technique to characterize cellular populations. Here we
present MultiVI, a probabilistic model to analyze such
multiomic data and integrate it with single modality datasets.
MultiVI creates a joint representation that accurately
reflects both chromatin and transcriptional properties of the
cells even when one modality is missing. It also imputes
missing data, corrects for batch effects and is available in
the scvi-tools framework:
https://docs.scvi-tools.org/.Competing Interest StatementThe
authors have declared no competing interest.},
URL =
{https://www.biorxiv.org/content/early/2021/09/07/2021.08.20.457057},
eprint =
{https://www.biorxiv.org/content/early/2021/09/07/2021.08.20.457057.full.pdf},
journal = {bioRxiv}
}
#+end_src
* Biology
** Cobolt: integrative analysis of multimodal single-cell sequencing data
#+begin_src bibtex
@article{Gong2021,
author = {Gong, Boying and Zhou, Yun and Purdom, Elizabeth},
title = {Cobolt: integrative analysis of multimodal single-cell
sequencing data},
journal = {Genome Biology},
year = 2021,
month = {Dec},
day = 28,
volume = 22,
number = 1,
pages = 351,
abstract = {A growing number of single-cell sequencing platforms enable
joint profiling of multiple omics from the same cells. We
present Cobolt, a novel method that not only allows for
analyzing the data from joint-modality platforms, but provides
a coherent framework for the integration of multiple datasets
measured on different modalities. We demonstrate its
performance on multi-modality data of gene expression and
chromatin accessibility and illustrate the integration
abilities of Cobolt by jointly analyzing this multi-modality
data with single-cell RNA-seq and ATAC-seq datasets.},
issn = {1474-760X},
doi = {10.1186/s13059-021-02556-z},
url = {https://doi.org/10.1186/s13059-021-02556-z}
}
#+end_src
** MUON: multimodal omics analysis framework
#+begin_src bibtex
@article{Bredikhin2022,
author = {Bredikhin, Danila and Kats, Ilia and Stegle, Oliver},
title = {MUON: multimodal omics analysis framework},
journal = {Genome Biology},
year = 2022,
month = {Feb},
day = 01,
volume = 23,
number = 1,
pages = 42,
abstract = {Advances in multi-omics have led to an explosion of
multimodal datasets to address questions from basic biology to
translation. While these data provide novel opportunities for
discovery, they also pose management and analysis challenges,
thus motivating the development of tailored computational
solutions. Here, we present a data standard and an analysis
framework for multi-omics, MUON, designed to organise,
analyse, visualise, and exchange multimodal data. MUON stores
multimodal data in an efficient yet flexible and interoperable
data structure. MUON enables a versatile range of analyses,
from data preprocessing to flexible multi-omics alignment.},
issn = {1474-760X},
doi = {10.1186/s13059-021-02577-8},
url = {https://doi.org/10.1186/s13059-021-02577-8}
}
#+end_src
** Multimodal single cell data integration challenge: Results and lessons learned
#+begin_src bibtex
@inproceedings{pmlr-v176-lance22a,
title = {Multimodal single cell data integration challenge: Results
and lessons learned},
author = {Lance, Christopher and Luecken, Malte D. and Burkhardt,
Daniel B. and Cannoodt, Robrecht and Rautenstrauch, Pia and
Laddach, Anna and Ubingazhibov, Aidyn and Cao, Zhi-Jie and
Deng, Kaiwen and Khan, Sumeer and Liu, Qiao and Russkikh,
Nikolay and Ryazantsev, Gleb and Ohler, Uwe and data
integration competition participants, NeurIPS 2021 Multimodal
and Pisco, Angela Oliveira and Bloom, Jonathan and
Krishnaswamy, Smita and Theis, Fabian J.},
booktitle = {Proceedings of the NeurIPS 2021 Competitions and
Demonstrations Track},
pages = {162--176},
year = 2022,
editor = {Kiela, Douwe and Ciccone, Marco and Caputo, Barbara},
volume = 176,
series = {Proceedings of Machine Learning Research},
month = {06--14 Dec},
publisher = {PMLR},
pdf = {https://proceedings.mlr.press/v176/lance22a/lance22a.pdf},
url = {https://proceedings.mlr.press/v176/lance22a.html},
abstract = {Biology has become a data-intensive science. Recent
technological advances in single-cell genomics have enabled
the measurement of multiple facets of cellular state,
producing datasets with millions of single-cell observations.
While these data hold great promise for understanding
molecular mechanisms in health and disease, analysis
challenges arising from sparsity, technical and biological
variability, and high dimensionality of the data hinder the
derivation of such mechanistic insights. To promote the
innovation of algorithms for analysis of multimodal
single-cell data, we organized a competition at NeurIPS 2021
applying the Common Task Framework to multimodal single-cell
data integration. For this competition we generated the first
multimodal benchmarking dataset for single-cell biology and
defined three tasks in this domain: prediction of missing
modalities, aligning modalities, and learning a joint
representation across modalities. We further specified
evaluation metrics and developed a cloud-based algorithm
evaluation pipeline. Using this setup, 280 competitors
submitted over 2600 proposed solutions within a 3 month
period, showcasing substantial innovation especially in the
modality alignment task. Here, we present the results,
describe trends of well performing approaches, and discuss
challenges associated with running the competition.}
}
#+end_src

View File

@@ -134,6 +134,54 @@
state the goal and user for their explanations.",
}
@article{https://doi.org/10.48550/arxiv.2204.01678,
doi = {10.48550/ARXIV.2204.01678},
url = {https://arxiv.org/abs/2204.01678},
author = {Bachmann, Roman and Mizrahi, David and Atanov, Andrei and
Zamir, Amir},
keywords = {Computer Vision and Pattern Recognition (cs.CV), Machine
Learning (cs.LG), FOS: Computer and information sciences, FOS:
Computer and information sciences},
title = {MultiMAE: Multi-modal Multi-task Masked Autoencoders},
publisher = {arXiv},
year = 2022,
copyright = {arXiv.org perpetual, non-exclusive license}
}
@article{10.1093/bioinformatics/btab746,
author = {De Waele, Gaetan and Clauwaert, Jim and Menschaert, Gerben
and Waegeman, Willem},
title = "{CpG Transformer for imputation of single-cell methylomes}",
journal = {Bioinformatics},
volume = 38,
number = 3,
pages = {597-603},
year = 2021,
month = 10,
abstract = "{The adoption of current single-cell DNA methylation
sequencing protocols is hindered by incomplete coverage,
outlining the need for effective imputation techniques. The
task of imputing single-cell (methylation) data requires
models to build an understanding of underlying biological
processes.We adapt the transformer neural network architecture
to operate on methylation matrices through combining axial
attention with sliding window self-attention. The obtained CpG
Transformer displays state-of-the-art performances on a wide
range of scBS-seq and scRRBS-seq datasets. Furthermore, we
demonstrate the interpretability of CpG Transformer and
illustrate its rapid transfer learning properties, allowing
practitioners to train models on new datasets with a limited
computational and time budget.CpG Transformer is freely
available at
https://github.com/gdewael/cpg-transformer.Supplementary data
are available at Bioinformatics online.}",
issn = {1367-4803},
doi = {10.1093/bioinformatics/btab746},
url = {https://doi.org/10.1093/bioinformatics/btab746},
eprint =
{https://academic.oup.com/bioinformatics/article-pdf/38/3/597/42167564/btab746.pdf},
}
@article {Rao2021.02.12.430858,
author = {Rao, Roshan and Liu, Jason and Verkuil, Robert and Meier,
Joshua and Canny, John F. and Abbeel, Pieter and Sercu, Tom
@@ -223,3 +271,131 @@
doi = {10.1038/s41586-021-03819-2},
url = {https://doi.org/10.1038/s41586-021-03819-2}
}
@article {Ashuach2021.08.20.457057,
author = {Ashuach, Tal and Gabitto, Mariano I. and Jordan, Michael I.
and Yosef, Nir},
title = {MultiVI: deep generative model for the integration of
multi-modal data},
elocation-id = {2021.08.20.457057},
year = 2021,
doi = {10.1101/2021.08.20.457057},
publisher = {Cold Spring Harbor Laboratory},
abstract = {Jointly profiling the transcriptional and chromatin
accessibility landscapes of single-cells is a powerful
technique to characterize cellular populations. Here we
present MultiVI, a probabilistic model to analyze such
multiomic data and integrate it with single modality datasets.
MultiVI creates a joint representation that accurately
reflects both chromatin and transcriptional properties of the
cells even when one modality is missing. It also imputes
missing data, corrects for batch effects and is available in
the scvi-tools framework:
https://docs.scvi-tools.org/.Competing Interest StatementThe
authors have declared no competing interest.},
URL =
{https://www.biorxiv.org/content/early/2021/09/07/2021.08.20.457057},
eprint =
{https://www.biorxiv.org/content/early/2021/09/07/2021.08.20.457057.full.pdf},
journal = {bioRxiv}
}
@article{Gong2021,
author = {Gong, Boying and Zhou, Yun and Purdom, Elizabeth},
title = {Cobolt: integrative analysis of multimodal single-cell
sequencing data},
journal = {Genome Biology},
year = 2021,
month = {Dec},
day = 28,
volume = 22,
number = 1,
pages = 351,
abstract = {A growing number of single-cell sequencing platforms enable
joint profiling of multiple omics from the same cells. We
present Cobolt, a novel method that not only allows for
analyzing the data from joint-modality platforms, but provides
a coherent framework for the integration of multiple datasets
measured on different modalities. We demonstrate its
performance on multi-modality data of gene expression and
chromatin accessibility and illustrate the integration
abilities of Cobolt by jointly analyzing this multi-modality
data with single-cell RNA-seq and ATAC-seq datasets.},
issn = {1474-760X},
doi = {10.1186/s13059-021-02556-z},
url = {https://doi.org/10.1186/s13059-021-02556-z}
}
@article{Bredikhin2022,
author = {Bredikhin, Danila and Kats, Ilia and Stegle, Oliver},
title = {MUON: multimodal omics analysis framework},
journal = {Genome Biology},
year = 2022,
month = {Feb},
day = 01,
volume = 23,
number = 1,
pages = 42,
abstract = {Advances in multi-omics have led to an explosion of
multimodal datasets to address questions from basic biology to
translation. While these data provide novel opportunities for
discovery, they also pose management and analysis challenges,
thus motivating the development of tailored computational
solutions. Here, we present a data standard and an analysis
framework for multi-omics, MUON, designed to organise,
analyse, visualise, and exchange multimodal data. MUON stores
multimodal data in an efficient yet flexible and interoperable
data structure. MUON enables a versatile range of analyses,
from data preprocessing to flexible multi-omics alignment.},
issn = {1474-760X},
doi = {10.1186/s13059-021-02577-8},
url = {https://doi.org/10.1186/s13059-021-02577-8}
}
@inproceedings{pmlr-v176-lance22a,
title = {Multimodal single cell data integration challenge: Results
and lessons learned},
author = {Lance, Christopher and Luecken, Malte D. and Burkhardt,
Daniel B. and Cannoodt, Robrecht and Rautenstrauch, Pia and
Laddach, Anna and Ubingazhibov, Aidyn and Cao, Zhi-Jie and
Deng, Kaiwen and Khan, Sumeer and Liu, Qiao and Russkikh,
Nikolay and Ryazantsev, Gleb and Ohler, Uwe and data
integration competition participants, NeurIPS 2021 Multimodal
and Pisco, Angela Oliveira and Bloom, Jonathan and
Krishnaswamy, Smita and Theis, Fabian J.},
booktitle = {Proceedings of the NeurIPS 2021 Competitions and
Demonstrations Track},
pages = {162--176},
year = 2022,
editor = {Kiela, Douwe and Ciccone, Marco and Caputo, Barbara},
volume = 176,
series = {Proceedings of Machine Learning Research},
month = {06--14 Dec},
publisher = {PMLR},
pdf = {https://proceedings.mlr.press/v176/lance22a/lance22a.pdf},
url = {https://proceedings.mlr.press/v176/lance22a.html},
abstract = {Biology has become a data-intensive science. Recent
technological advances in single-cell genomics have enabled
the measurement of multiple facets of cellular state,
producing datasets with millions of single-cell observations.
While these data hold great promise for understanding
molecular mechanisms in health and disease, analysis
challenges arising from sparsity, technical and biological
variability, and high dimensionality of the data hinder the
derivation of such mechanistic insights. To promote the
innovation of algorithms for analysis of multimodal
single-cell data, we organized a competition at NeurIPS 2021
applying the Common Task Framework to multimodal single-cell
data integration. For this competition we generated the first
multimodal benchmarking dataset for single-cell biology and
defined three tasks in this domain: prediction of missing
modalities, aligning modalities, and learning a joint
representation across modalities. We further specified
evaluation metrics and developed a cloud-based algorithm
evaluation pipeline. Using this setup, 280 competitors
submitted over 2600 proposed solutions within a 3 month
period, showcasing substantial innovation especially in the
modality alignment task. Here, we present the results,
describe trends of well performing approaches, and discuss
challenges associated with running the competition.}
}