diff --git a/_data/single-cell-transformers.yml b/_data/single-cell-transformers.yml index 6e6c2c5..b5816e3 100644 --- a/_data/single-cell-transformers.yml +++ b/_data/single-cell-transformers.yml @@ -1,3 +1,361 @@ +- model: scGREAT + paper: + type: peer_reviewed + text: '[Yuchen Wang et al. 2024](https://www.cell.com/iscience/pdf/S2589-0042%2824%2900573-X.pdf)' + url: https://www.cell.com/iscience/pdf/S2589-0042%2824%2900573-X.pdf + code: + type: reproducible + text: "[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/WangyuchenCS/scGREAT)" + url: https://github.com/WangyuchenCS/scGREAT + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: Nicheformer + paper: + type: peer_reviewed + text: '[Anna C. Schaar et al. 2024](https://papers.ssrn.com/sol3/papers.cfm?abstract_id=4803291)' + url: https://papers.ssrn.com/sol3/papers.cfm?abstract_id=4803291 + code: + type: reproducible + text: "[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/theislab/nicheformer)" + url: https://github.com/theislab/nicheformer + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: scmFormer + paper: + type: preprint + text: '[Jing Xu et al. 2024](https://pmc.ncbi.nlm.nih.gov/articles/PMC11109621/)' + url: https://pmc.ncbi.nlm.nih.gov/articles/PMC11109621/ + code: + type: evaluation_only + text: "[ð\x9F\x94\x8DGitHub](https://github.com/zhanglab-wbgcas/scmFormer)" + url: https://github.com/zhanglab-wbgcas/scmFormer + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: Metric Mirages + paper: + type: preprint + text: '[Hanchen Wang et al. 2024](https://www.biorxiv.org/content/10.1101/2024.04.02.587824v1.full.pdf)' + url: https://www.biorxiv.org/content/10.1101/2024.04.02.587824v1.full.pdf + code: + type: '-' + text: '-' + url: '-' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: scEmb + paper: + type: preprint + text: '[Kang-Lin Hsieh et al. 2024](https://www.biorxiv.org/content/10.1101/2024.09.24.614685v1)' + url: https://www.biorxiv.org/content/10.1101/2024.09.24.614685v1 + code: + type: '-' + text: '-' + url: '-' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + + + +- model: Cell-ontology guided transcriptome foundation model + paper: + type: preprint + text: '[Xinyu Yuan et al. 2024](https://arxiv.org/pdf/2408.12373)' + url: https://arxiv.org/pdf/2408.12373 + code: + type: '-' + text: "[](https://github.com/zhanglab-wbgcas/scmFormer)" + url: 'https://github.com/DeepGraphLearning/scCello' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: Cell-Graph Compass + paper: + type: preprint + text: '[Chen Fang et al. 2024](https://www.biorxiv.org/content/10.1101/2024.06.04.597354v1.full.pdf)' + url: https://www.biorxiv.org/content/10.1101/2024.06.04.597354v1.full.pdf + code: + type: 'reproducible' + text: "[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/epang-ucas/Cell-Graph-Compass)" + url: 'https://github.com/epang-ucas/Cell-Graph-Compass' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: scGAA + paper: + type: peer_reviewed + text: '[Tianci Kong et al. 2024](https://www.nature.com/articles/s41598-024-73356-1)' + url: https://www.nature.com/articles/s41598-024-73356-1 + code: + type: 'evaluation_only' + text: "[ð\x9F\x94\x8DGitHub]https://github.com/kongtianci/scGAA)" + url: 'https://github.com/kongtianci/scGAA' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: scFusionTTT + paper: + type: preprint + text: '[Dian Meng et al. 2024](https://openreview.net/forum?id=7rR6RAUaoC)' + url: https://openreview.net/forum?id=7rR6RAUaoC + code: + type: '-' + text: '-' + url: '-' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + + +- model: scCello + paper: + type: preprint + text: '[Xinyu Yuan et al. 2024](https://github.com/theislab/single-cell-transformer-papers/issues/32)' + url: https://github.com/theislab/single-cell-transformer-papers/issues/32 + code: + type: '-' + text: "[ð\x9F\x94\x8DGitHub](https://github.com/DeepGraphLearning/scCello)" + url: 'https://github.com/DeepGraphLearning/scCello' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: scGenePT + paper: + type: preprint + text: '[Ana-Maria Istrate et al. 2024](https://www.biorxiv.org/content/10.1101/2024.10.23.619972v1.full.pdf)' + url: https://www.biorxiv.org/content/10.1101/2024.10.23.619972v1.full.pdf + code: + type: 'reproducible' + text: "[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/czi-ai/scGenePT)" + url: 'https://github.com/czi-ai/scGenePT' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: ENHANCING GENERATIVE PERTURBATION MODELS WITH LLM-INFORMED GENE EMBEDDINGS + paper: + type: preprint + text: '[Kaspar Märtens et al. 2024](https://openreview.net/pdf?id=eb3ndUlkt4)' + url: https://openreview.net/pdf?id=eb3ndUlkt4 + code: + type: '-' + text: "-" + url: '-' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: scSwinTNet + paper: + type: peer_reviewed + text: '[Huanhuan Dai et al. 2024](https://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=10737051)' + url: https://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=10737051 + code: + type: 'reproducible' + text: "[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/Danica123/scSwinTNet)" + url: 'https://github.com/Danica123/scSwinTNet' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: sclong + paper: + type: preprint + text: '[Ding Bai et al. 2024](https://www.biorxiv.org/content/10.1101/2024.11.09.622759v2)' + url: https://www.biorxiv.org/content/10.1101/2024.11.09.622759v2 + code: + type: 'reproducible' + text: "[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/BaiDing1234/scLong)" + url: 'https://github.com/BaiDing1234/scLong' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: WHITE-BOX DIFFUSION TRANSFORMER FOR SINGLE-CELL RNA-SEQ GENERATION + paper: + type: preprint + text: '[Zhuorui Cui et al. 2024](https://arxiv.org/pdf/2411.06785)' + url: https://arxiv.org/pdf/2411.06785 + code: + type: '-' + text: '-' + url: '-' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: "A framework for gene representation on spatial transcriptomics" + paper: + type: preprint + text: '[Shenghao Cao et al. 2024](https://www.biorxiv.org/content/10.1101/2024.09.27.615337v5.full)' + url: https://www.biorxiv.org/content/10.1101/2024.09.27.615337v5.full + code: + type: '-' + text: '-' + url: '-' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + + +- model: genohoption + paper: + type: preprint + text: '[Jiabei Cheng et al. 2024](https://arxiv.org/pdf/2411.06331)' + url: https://arxiv.org/pdf/2411.06331 + code: + type: 'reproducible' + text: "[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/Bunnybeibei/GenoHoption)" + url: 'https://github.com/Bunnybeibei/GenoHoption' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: Cellpatch + paper: + type: preprint + text: '[Hanwen Zhu et al. 2024](https://www.biorxiv.org/content/10.1101/2024.11.15.623701v1.full.pdf)' + url: https://www.biorxiv.org/content/10.1101/2024.11.15.623701v1.full.pdf + code: + type: 'reproducible' + text: '[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/HanwenZhu98/CellPatch)' + url: 'https://github.com/HanwenZhu98/CellPatch' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: GRNPT + paper: + type: preprint + text: '[Guangzheng Weng et al. 2024](https://advanced.onlinelibrary.wiley.com/doi/pdf/10.1002/advs.202409990)' + url: https://advanced.onlinelibrary.wiley.com/doi/pdf/10.1002/advs.202409990 + code: + type: 'evaluation_only' + text: '[ð\x9F\x94\x8DGitHub](https://github.com/wgzgithub/GRNPT)' + url: 'https://github.com/wgzgithub/GRNPT' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + + +- model: Aido.cell + paper: + type: preprint + text: '[Nicholas Ho et al. 2024](https://www.biorxiv.org/content/10.1101/2024.11.28.625303v1.full)' + url: https://www.biorxiv.org/content/10.1101/2024.11.28.625303v1.full + code: + type: 'evaluation_only' + text: '[ð\x9F\x94\x8DGitHub](https://github.com/wgzgithub/GRNPT)' + url: 'https://huggingface.co/genbio-ai/AIDO.Cell-100M/tree/main' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: sctel + paper: + type: peer_reviewed + text: '[Yuanyuan Chen et al. 2024](https://www.nature.com/articles/s41540-024-00484-9)' + url: https://www.nature.com/articles/s41540-024-00484-9 + code: + type: 'reproducible' + text: '[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/142857cyy/scTEL)' + u'rl: 'https://github.com/142857cyy/scTEL' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + + +- model: "Toward a privacy-preserving predictive foundation model" + paper: + type: preprint + text: '[Jiayuan Ding et al. 2024](https://www.biorxiv.org/content/10.1101/2025.01.06.631427v1.full.pdf)' + url: https://www.biorxiv.org/content/10.1101/2025.01.06.631427v1.full.pdf + code: + type: '-' + text: '-' + url: '-' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + - model: mcBERT paper: type: preprint diff --git a/_data/transformer-evaluation.yml b/_data/transformer-evaluation.yml index db9503f..3dc4986 100644 --- a/_data/transformer-evaluation.yml +++ b/_data/transformer-evaluation.yml @@ -1,3 +1,103 @@ +- paper: + type: preprint + text: '[Kaspar Märtens et al. 2024](https://openreview.net/pdf?id=eb3ndUlkt4)' + url: https://openreview.net/pdf?id=eb3ndUlkt4 + code: + type: 'reproducible' + text: '[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/valence-labs/Tx-Evaluation)' + url: 'https://github.com/valence-labs/Tx-Evaluation' + omic_modalities: '-' + evaluated_transformers: '-' + tasks: '-' + notes: '-' + + + +- paper: + type: preprint + text: '[Ihab Bendidi et al. 2024](https://arxiv.org/pdf/2410.13956)' + url: https://arxiv.org/pdf/2410.13956 + code: + type: 'reproducible' + text: '[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/valence-labs/Tx-Evaluation)' + url: 'https://github.com/valence-labs/Tx-Evaluation' + omic_modalities: '-' + evaluated_transformers: '-' + tasks: '-' + notes: '-' + + +- paper: + type: preprint + text: '[George Crowley et al. 2024](https://www.biorxiv.org/content/10.1101/2024.10.10.617605v1.full.pdf)' + url: https://www.biorxiv.org/content/10.1101/2024.10.10.617605v1.full.pdf + code: + type: 'reproducible' + text: '[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/ggit12/anndictionary/)' + url: 'https://github.com/ggit12/anndictionary/' + omic_modalities: '-' + evaluated_transformers: '-' + tasks: '-' + notes: '-' + + + +- paper: + type: preprint + text: '[George Crowley et al. 2024](https://www.biorxiv.org/content/10.1101/2024.10.10.617605v1.full.pdf)' + url: https://www.biorxiv.org/content/10.1101/2024.10.10.617605v1.full.pdf + code: + type: 'reproducible' + text: '[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/ggit12/anndictionary/)' + url: 'https://github.com/ggit12/anndictionary/' + omic_modalities: '-' + evaluated_transformers: '-' + tasks: '-' + notes: '-' + + +- paper: + type: preprint + text: '[Yan Wu et al. 2024](https://scholar.google.com/scholar?cluster=18315006149844520972&hl=en&as_sdt=0,5)' + url: https://scholar.google.com/scholar?cluster=18315006149844520972&hl=en&as_sdt=0,5 + code: + type: 'reproducible' + text: '[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/altoslabs/perturbench)' + url: 'https://github.com/altoslabs/perturbench' + omic_modalities: '-' + evaluated_transformers: '-' + tasks: '-' + notes: '-' + +- paper: + type: preprint + text: '[A. Wenteler et al. 2024](https://www.biorxiv.org/content/10.1101/2024.10.02.616248v1.abstract)' + url: https://www.biorxiv.org/content/10.1101/2024.10.02.616248v1.abstract + code: + type: 'reproducible' + text: '[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/aaronwtr/PertEval)' + url: 'https://github.com/aaronwtr/PertEval' + omic_modalities: '-' + evaluated_transformers: '-' + tasks: '-' + notes: '-' + + + +- paper: + type: preprint + text: '[Eric Kernfeld et al. 2024](https://www.biorxiv.org/content/10.1101/2023.07.28.551039v2.full)' + url: https://www.biorxiv.org/content/10.1101/2023.07.28.551039v2.full + code: + type: 'reproducible' + text: '[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/ekernf01/perturbation_benchmarking)' + url: 'https://github.com/ekernf01/perturbation_benchmarking' + omic_modalities: '-' + evaluated_transformers: '-' + tasks: '-' + notes: '-' + + - paper: type: preprint text: '[Yoav Kan-Tor et al. 2024](https://arxiv.org/abs/2412.04075)' diff --git a/_data/transformer-llms.yml b/_data/transformer-llms.yml index f01e8a6..978c6c7 100644 --- a/_data/transformer-llms.yml +++ b/_data/transformer-llms.yml @@ -1,3 +1,20 @@ +- model: stFormer + paper: + type: preprint + text: '[Shenghao Cao et al. 2024](https://www.biorxiv.org/content/10.1101/2024.09.27.615337v1)' + url: https://www.biorxiv.org/content/10.1101/2024.09.27.615337v1 + code: + type: 'reproducible' + text: "[ð\x9F\x94\x8DGitHub](https://github.com/ucaswangls/STFormer)" + url: 'https://github.com/ucaswangls/STFormer' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + + - model: scChat paper: type: preprint diff --git a/_site/_data/single-cell-transformers.yml b/_site/_data/single-cell-transformers.yml index 10d0c96..b5816e3 100644 --- a/_site/_data/single-cell-transformers.yml +++ b/_site/_data/single-cell-transformers.yml @@ -1,3 +1,391 @@ +- model: scGREAT + paper: + type: peer_reviewed + text: '[Yuchen Wang et al. 2024](https://www.cell.com/iscience/pdf/S2589-0042%2824%2900573-X.pdf)' + url: https://www.cell.com/iscience/pdf/S2589-0042%2824%2900573-X.pdf + code: + type: reproducible + text: "[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/WangyuchenCS/scGREAT)" + url: https://github.com/WangyuchenCS/scGREAT + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: Nicheformer + paper: + type: peer_reviewed + text: '[Anna C. Schaar et al. 2024](https://papers.ssrn.com/sol3/papers.cfm?abstract_id=4803291)' + url: https://papers.ssrn.com/sol3/papers.cfm?abstract_id=4803291 + code: + type: reproducible + text: "[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/theislab/nicheformer)" + url: https://github.com/theislab/nicheformer + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: scmFormer + paper: + type: preprint + text: '[Jing Xu et al. 2024](https://pmc.ncbi.nlm.nih.gov/articles/PMC11109621/)' + url: https://pmc.ncbi.nlm.nih.gov/articles/PMC11109621/ + code: + type: evaluation_only + text: "[ð\x9F\x94\x8DGitHub](https://github.com/zhanglab-wbgcas/scmFormer)" + url: https://github.com/zhanglab-wbgcas/scmFormer + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: Metric Mirages + paper: + type: preprint + text: '[Hanchen Wang et al. 2024](https://www.biorxiv.org/content/10.1101/2024.04.02.587824v1.full.pdf)' + url: https://www.biorxiv.org/content/10.1101/2024.04.02.587824v1.full.pdf + code: + type: '-' + text: '-' + url: '-' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: scEmb + paper: + type: preprint + text: '[Kang-Lin Hsieh et al. 2024](https://www.biorxiv.org/content/10.1101/2024.09.24.614685v1)' + url: https://www.biorxiv.org/content/10.1101/2024.09.24.614685v1 + code: + type: '-' + text: '-' + url: '-' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + + + +- model: Cell-ontology guided transcriptome foundation model + paper: + type: preprint + text: '[Xinyu Yuan et al. 2024](https://arxiv.org/pdf/2408.12373)' + url: https://arxiv.org/pdf/2408.12373 + code: + type: '-' + text: "[](https://github.com/zhanglab-wbgcas/scmFormer)" + url: 'https://github.com/DeepGraphLearning/scCello' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: Cell-Graph Compass + paper: + type: preprint + text: '[Chen Fang et al. 2024](https://www.biorxiv.org/content/10.1101/2024.06.04.597354v1.full.pdf)' + url: https://www.biorxiv.org/content/10.1101/2024.06.04.597354v1.full.pdf + code: + type: 'reproducible' + text: "[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/epang-ucas/Cell-Graph-Compass)" + url: 'https://github.com/epang-ucas/Cell-Graph-Compass' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: scGAA + paper: + type: peer_reviewed + text: '[Tianci Kong et al. 2024](https://www.nature.com/articles/s41598-024-73356-1)' + url: https://www.nature.com/articles/s41598-024-73356-1 + code: + type: 'evaluation_only' + text: "[ð\x9F\x94\x8DGitHub]https://github.com/kongtianci/scGAA)" + url: 'https://github.com/kongtianci/scGAA' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: scFusionTTT + paper: + type: preprint + text: '[Dian Meng et al. 2024](https://openreview.net/forum?id=7rR6RAUaoC)' + url: https://openreview.net/forum?id=7rR6RAUaoC + code: + type: '-' + text: '-' + url: '-' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + + +- model: scCello + paper: + type: preprint + text: '[Xinyu Yuan et al. 2024](https://github.com/theislab/single-cell-transformer-papers/issues/32)' + url: https://github.com/theislab/single-cell-transformer-papers/issues/32 + code: + type: '-' + text: "[ð\x9F\x94\x8DGitHub](https://github.com/DeepGraphLearning/scCello)" + url: 'https://github.com/DeepGraphLearning/scCello' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: scGenePT + paper: + type: preprint + text: '[Ana-Maria Istrate et al. 2024](https://www.biorxiv.org/content/10.1101/2024.10.23.619972v1.full.pdf)' + url: https://www.biorxiv.org/content/10.1101/2024.10.23.619972v1.full.pdf + code: + type: 'reproducible' + text: "[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/czi-ai/scGenePT)" + url: 'https://github.com/czi-ai/scGenePT' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: ENHANCING GENERATIVE PERTURBATION MODELS WITH LLM-INFORMED GENE EMBEDDINGS + paper: + type: preprint + text: '[Kaspar Märtens et al. 2024](https://openreview.net/pdf?id=eb3ndUlkt4)' + url: https://openreview.net/pdf?id=eb3ndUlkt4 + code: + type: '-' + text: "-" + url: '-' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: scSwinTNet + paper: + type: peer_reviewed + text: '[Huanhuan Dai et al. 2024](https://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=10737051)' + url: https://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=10737051 + code: + type: 'reproducible' + text: "[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/Danica123/scSwinTNet)" + url: 'https://github.com/Danica123/scSwinTNet' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: sclong + paper: + type: preprint + text: '[Ding Bai et al. 2024](https://www.biorxiv.org/content/10.1101/2024.11.09.622759v2)' + url: https://www.biorxiv.org/content/10.1101/2024.11.09.622759v2 + code: + type: 'reproducible' + text: "[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/BaiDing1234/scLong)" + url: 'https://github.com/BaiDing1234/scLong' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: WHITE-BOX DIFFUSION TRANSFORMER FOR SINGLE-CELL RNA-SEQ GENERATION + paper: + type: preprint + text: '[Zhuorui Cui et al. 2024](https://arxiv.org/pdf/2411.06785)' + url: https://arxiv.org/pdf/2411.06785 + code: + type: '-' + text: '-' + url: '-' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: "A framework for gene representation on spatial transcriptomics" + paper: + type: preprint + text: '[Shenghao Cao et al. 2024](https://www.biorxiv.org/content/10.1101/2024.09.27.615337v5.full)' + url: https://www.biorxiv.org/content/10.1101/2024.09.27.615337v5.full + code: + type: '-' + text: '-' + url: '-' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + + +- model: genohoption + paper: + type: preprint + text: '[Jiabei Cheng et al. 2024](https://arxiv.org/pdf/2411.06331)' + url: https://arxiv.org/pdf/2411.06331 + code: + type: 'reproducible' + text: "[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/Bunnybeibei/GenoHoption)" + url: 'https://github.com/Bunnybeibei/GenoHoption' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: Cellpatch + paper: + type: preprint + text: '[Hanwen Zhu et al. 2024](https://www.biorxiv.org/content/10.1101/2024.11.15.623701v1.full.pdf)' + url: https://www.biorxiv.org/content/10.1101/2024.11.15.623701v1.full.pdf + code: + type: 'reproducible' + text: '[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/HanwenZhu98/CellPatch)' + url: 'https://github.com/HanwenZhu98/CellPatch' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: GRNPT + paper: + type: preprint + text: '[Guangzheng Weng et al. 2024](https://advanced.onlinelibrary.wiley.com/doi/pdf/10.1002/advs.202409990)' + url: https://advanced.onlinelibrary.wiley.com/doi/pdf/10.1002/advs.202409990 + code: + type: 'evaluation_only' + text: '[ð\x9F\x94\x8DGitHub](https://github.com/wgzgithub/GRNPT)' + url: 'https://github.com/wgzgithub/GRNPT' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + + +- model: Aido.cell + paper: + type: preprint + text: '[Nicholas Ho et al. 2024](https://www.biorxiv.org/content/10.1101/2024.11.28.625303v1.full)' + url: https://www.biorxiv.org/content/10.1101/2024.11.28.625303v1.full + code: + type: 'evaluation_only' + text: '[ð\x9F\x94\x8DGitHub](https://github.com/wgzgithub/GRNPT)' + url: 'https://huggingface.co/genbio-ai/AIDO.Cell-100M/tree/main' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: sctel + paper: + type: peer_reviewed + text: '[Yuanyuan Chen et al. 2024](https://www.nature.com/articles/s41540-024-00484-9)' + url: https://www.nature.com/articles/s41540-024-00484-9 + code: + type: 'reproducible' + text: '[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/142857cyy/scTEL)' + u'rl: 'https://github.com/142857cyy/scTEL' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + + +- model: "Toward a privacy-preserving predictive foundation model" + paper: + type: preprint + text: '[Jiayuan Ding et al. 2024](https://www.biorxiv.org/content/10.1101/2025.01.06.631427v1.full.pdf)' + url: https://www.biorxiv.org/content/10.1101/2025.01.06.631427v1.full.pdf + code: + type: '-' + text: '-' + url: '-' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + +- model: mcBERT + paper: + type: preprint + text: '[von Querfurth et al. 2024](https://doi.org/10.1101/2024.11.04.621897)' + url: https://doi.org/10.1101/2024.11.04.621897 + code: + type: reproducible + text: "[ð\x9F\x9B\_ï¸\x8FGithub](https://github.com/COMSYS/mcBERT)" + url: https://github.com/COMSYS/mcBERT + omic_modalities: scRNA-seq + pre_training_dataset: 7M cells single tissue, human (see Table 1 in the paper; heart, kidney, PBMC, and lung) + input_embedding: Cells as tokens + value projection + architecture: Transformer Encoder / BERT + ssl_tasks: MLM on cell-level, based on unmasked cells of patient + supervised_tasks: Phenotype classification +- model: CancerFoundation + paper: + type: preprint + text: '[Theus et al. 2024](https://doi.org/10.1101/2024.11.01.621087)' + url: https://doi.org/10.1101/2024.11.01.621087 + code: + type: reproducible + text: "[ð\x9F\x9B\_ï¸\x8FGithub](https://github.com/BoevaLab/CancerFoundation)" + url: https://github.com/BoevaLab/CancerFoundation + omic_modalities: scRNA-seq + pre_training_dataset: '1M / Only malignant cells from the [Curated Cancer Cell Atlas](https://www.nature.com/articles/s41586-023-06130-4)' + input_embedding: 'Value categorization: value binning' + architecture: 'Other: attention masking in encoder' + ssl_tasks: Iterative MLM variant with MSE loss, cell token expression prediction, gene expression prediction + supervised_tasks: Drug response prediction - model: Precious3GPT paper: type: preprint diff --git a/_site/_data/transformer-evaluation.yml b/_site/_data/transformer-evaluation.yml index 55aa966..bc35cf4 100644 --- a/_site/_data/transformer-evaluation.yml +++ b/_site/_data/transformer-evaluation.yml @@ -1,3 +1,103 @@ +- paper: + type: preprint + text: '[Kaspar Märtens et al. 2024](https://openreview.net/pdf?id=eb3ndUlkt4)' + url: https://openreview.net/pdf?id=eb3ndUlkt4 + code: + type: 'reproducible' + text: '[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/valence-labs/Tx-Evaluation)' + url: 'https://github.com/valence-labs/Tx-Evaluation' + omic_modalities: '-' + evaluated_transformers: '-' + tasks: '-' + notes: '-' + + + +- paper: + type: preprint + text: '[Ihab Bendidi et al. 2024](https://arxiv.org/pdf/2410.13956)' + url: https://arxiv.org/pdf/2410.13956 + code: + type: 'reproducible' + text: '[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/valence-labs/Tx-Evaluation)' + url: 'https://github.com/valence-labs/Tx-Evaluation' + omic_modalities: '-' + evaluated_transformers: '-' + tasks: '-' + notes: '-' + + +- paper: + type: preprint + text: '[George Crowley et al. 2024](https://www.biorxiv.org/content/10.1101/2024.10.10.617605v1.full.pdf)' + url: https://www.biorxiv.org/content/10.1101/2024.10.10.617605v1.full.pdf + code: + type: 'reproducible' + text: '[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/ggit12/anndictionary/)' + url: 'https://github.com/ggit12/anndictionary/' + omic_modalities: '-' + evaluated_transformers: '-' + tasks: '-' + notes: '-' + + + +- paper: + type: preprint + text: '[George Crowley et al. 2024](https://www.biorxiv.org/content/10.1101/2024.10.10.617605v1.full.pdf)' + url: https://www.biorxiv.org/content/10.1101/2024.10.10.617605v1.full.pdf + code: + type: 'reproducible' + text: '[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/ggit12/anndictionary/)' + url: 'https://github.com/ggit12/anndictionary/' + omic_modalities: '-' + evaluated_transformers: '-' + tasks: '-' + notes: '-' + + +- paper: + type: preprint + text: '[Yan Wu et al. 2024](https://scholar.google.com/scholar?cluster=18315006149844520972&hl=en&as_sdt=0,5)' + url: https://scholar.google.com/scholar?cluster=18315006149844520972&hl=en&as_sdt=0,5 + code: + type: 'reproducible' + text: '[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/altoslabs/perturbench)' + url: 'https://github.com/altoslabs/perturbench' + omic_modalities: '-' + evaluated_transformers: '-' + tasks: '-' + notes: '-' + +- paper: + type: preprint + text: '[A. Wenteler et al. 2024](https://www.biorxiv.org/content/10.1101/2024.10.02.616248v1.abstract)' + url: https://www.biorxiv.org/content/10.1101/2024.10.02.616248v1.abstract + code: + type: 'reproducible' + text: '[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/aaronwtr/PertEval)' + url: 'https://github.com/aaronwtr/PertEval' + omic_modalities: '-' + evaluated_transformers: '-' + tasks: '-' + notes: '-' + + + +- paper: + type: preprint + text: '[Eric Kernfeld et al. 2024](https://www.biorxiv.org/content/10.1101/2023.07.28.551039v2.full)' + url: https://www.biorxiv.org/content/10.1101/2023.07.28.551039v2.full + code: + type: 'reproducible' + text: '[ð\x9F\x9B\_ï¸\x8FGitHub](https://github.com/ekernf01/perturbation_benchmarking)' + url: 'https://github.com/ekernf01/perturbation_benchmarking' + omic_modalities: '-' + evaluated_transformers: '-' + tasks: '-' + notes: '-' + + - paper: type: preprint text: '[Yoav Kan-Tor et al. 2024](https://arxiv.org/abs/2412.04075)' @@ -9,7 +109,7 @@ omic_modalities: Natural Language, scRNAseq, protein sequence, DNA sequence evaluated_transformers: Mistral, MPnet, CellPLM, GeneFormer, scGPT, DNABert2, ESM (plus bag-of-words, gene2vec) tasks: genomic properties, gene regulatory functions, gene localization, gene biological processes, protein properties - notes: '-' + notes: 'Evaluating model performance using gene embeddings allows comparing models utilizing different data modalities. The performance profile of a diverse set of models across ~300 gene related tasks was shown to be most influenced by the training modality.' - paper: type: preprint text: '[Ahlmann-Eltze et al. 2024](https://www.biorxiv.org/content/10.1101/2024.09.16.613342)' diff --git a/_site/_data/transformer-llms.yml b/_site/_data/transformer-llms.yml index f01e8a6..978c6c7 100644 --- a/_site/_data/transformer-llms.yml +++ b/_site/_data/transformer-llms.yml @@ -1,3 +1,20 @@ +- model: stFormer + paper: + type: preprint + text: '[Shenghao Cao et al. 2024](https://www.biorxiv.org/content/10.1101/2024.09.27.615337v1)' + url: https://www.biorxiv.org/content/10.1101/2024.09.27.615337v1 + code: + type: 'reproducible' + text: "[ð\x9F\x94\x8DGitHub](https://github.com/ucaswangls/STFormer)" + url: 'https://github.com/ucaswangls/STFormer' + omic_modalities: '-' + pre_training_dataset: '-' + input_embedding: '-' + architecture: '-' + ssl_tasks: '-' + supervised_tasks: '-' + + - model: scChat paper: type: preprint diff --git a/_site/_pages/implementations.html b/_site/_pages/implementations.html index 8c37983..f9f4e09 100644 --- a/_site/_pages/implementations.html +++ b/_site/_pages/implementations.html @@ -974,9 +974,9 @@