Update scripts #25

Merged: 9 commits, Jul 3, 2024
29 changes: 15 additions & 14 deletions README.md
@@ -10,10 +10,10 @@
## Table of Contents

- [Introduction](#introduction)
- [Installation](#installation)
- [Datasets](#datasets)
- [Models](#models)
- [Tasks](#tasks)
- [Installation](#installation)
- [Developing](#🧑🏿‍💻-developing)

## Introduction
@@ -22,6 +22,16 @@ AtomGen provides a robust framework for handling atomistic graph datasets focusi

It streamlines the process of aggregation, standardization, and utilization of datasets from diverse sources, enabling large-scale pre-training and generative modeling on atomistic graphs.


## Installation

The package can be installed using poetry:

```bash
python3 -m poetry install
source $(poetry env info --path)/bin/activate
```
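
After installing, a quick import check can confirm the environment is wired up. This is a minimal sketch under the assumption that the package is importable as `atomgen` inside the activated Poetry environment:

```python
# Minimal post-install sanity check (assumes the activated Poetry environment
# and that the package is importable as `atomgen`).
import atomgen

print("AtomGen imported from:", atomgen.__file__)
```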

## Datasets

AtomGen facilitates the aggregation and standardization of datasets, including but not limited to:
@@ -36,9 +46,9 @@ Currently, AtomGen has pre-processed datasets for the S2EF pre-training task for

AtomGen supports a variety of models for training on atomistic graph datasets, including:

- SchNet
- TokenGT
- Uni-Mol+ (Modified)
- **[SchNet](https://arxiv.org/abs/1706.08566)**: A continuous-filter convolutional neural network for modeling quantum interactions.
- **[TokenGT](https://github.com/jw9730/tokengt)**: Tokenized graph transformer that treats all nodes and edges as independent tokens.
- **AtomFormer**: Custom architecture that leverages Gaussian pairwise positional embeddings and self-attention to model atomistic graphs (see the sketch below).
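
For intuition, here is a self-contained sketch of the kind of Gaussian pairwise distance expansion the AtomFormer bullet refers to. The function, its `k` and `max_dist` parameters, and the choice of basis widths are illustrative assumptions, not code from this repository (though `k` plausibly corresponds to the `k` field in the model configs):

```python
import torch

def gaussian_pairwise_features(coords: torch.Tensor, k: int = 128,
                               max_dist: float = 12.0) -> torch.Tensor:
    """Expand pairwise atomic distances onto k Gaussian basis functions.

    coords: (num_atoms, 3) Cartesian coordinates.
    Returns a (num_atoms, num_atoms, k) tensor of distance features that a
    transformer can fold into its attention bias / positional embeddings.
    """
    dist = torch.cdist(coords, coords)          # (N, N) pairwise distances
    centers = torch.linspace(0.0, max_dist, k)  # k evenly spaced Gaussian centers
    width = max_dist / k                        # shared Gaussian width
    return torch.exp(-((dist.unsqueeze(-1) - centers) ** 2) / (2 * width ** 2))

# Example: featurize a random 4-atom structure.
feats = gaussian_pairwise_features(torch.randn(4, 3))
print(feats.shape)  # torch.Size([4, 4, 128])
```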

## Tasks

@@ -50,16 +60,7 @@ Experimentation with pre-training tasks is facilitated through AtomGen, includin

- **Coordinate Denoising**: Denoising atom coordinates.

These tasks are all facilitated through the DataCollatorForAtomModeling class and can be used simultaneously or individually.

## Installation

The package can be installed using poetry:

```bash
python3 -m poetry install
source $(poetry env info --path)/bin/activate
```
These tasks are all facilitated through the `DataCollatorForAtomModeling` class and can be used simultaneously or individually.
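
The collator's actual signature is not shown in this diff, so rather than guess at it, here is a self-contained sketch of what a coordinate-denoising collation step typically does; it illustrates the task, not AtomGen's implementation:

```python
import torch

def collate_with_coordinate_denoising(batch, noise_std: float = 0.1):
    """Toy collation for the coordinate-denoising task: perturb the input
    coordinates and keep the clean ones as the regression target.
    Illustration only; not the DataCollatorForAtomModeling API."""
    coords = torch.stack([sample["coords"] for sample in batch])  # (B, N, 3)
    noise = torch.randn_like(coords) * noise_std
    return {
        "input_coords": coords + noise,  # what the model sees
        "target_coords": coords,         # what it should recover
    }

# Tiny usage example with two fake 3-atom structures.
batch = [{"coords": torch.randn(3, 3)} for _ in range(2)]
out = collate_with_coordinate_denoising(batch)
print(out["input_coords"].shape, out["target_coords"].shape)
```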


## 🧑🏿‍💻 Developing

@@ -5,8 +5,6 @@
"depth": 12,
"mlp_ratio": 4,
"k": 128,
"op_hidden_dim": 16,
"tr_hidden_dim": 16,
"dropout": 0.0,
"mask_token_id": 0,
"pad_token_id": 119,

@@ -1,9 +1,11 @@
{
"vocab_size": 122,
"vocab_size": 123,
"dim": 1024,
"num_heads": 16,
"num_heads": 32,
"depth": 24,
"mlp_ratio": 4,
"k": 128,
"dropout": 0.0,
"mask_token_id": 0,
"pad_token_id": 119,
"bos_token_id": 120,

@@ -1,9 +1,9 @@
{
"vocab_size": 123,
"dim": 768,
"num_heads": 32,
"depth": 12,
"mlp_ratio": 1,
"dim": 128,
"num_heads": 4,
"depth": 2,
"mlp_ratio": 4,
"k": 128,
"op_hidden_dim": 16,
"tr_hidden_dim": 16,
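
Because `AtomformerConfig` (added below) subclasses `PretrainedConfig`, JSON files like the ones above can be loaded directly through the `transformers` config machinery. The filename below is a placeholder, since the file names for these hunks are not visible in this view:

```python
# Load one of the JSON configs via the PretrainedConfig helpers.
# The path is a placeholder; substitute the real file under atomgen/models/configs/.
from atomgen.models.configuration_atomformer import AtomformerConfig

config = AtomformerConfig.from_json_file("atomgen/models/configs/atomformer-base.json")
print(config.vocab_size, config.dim, config.num_heads, config.depth)
```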
12 changes: 0 additions & 12 deletions atomgen/models/configs/transformer-base.json

This file was deleted.

15 changes: 0 additions & 15 deletions atomgen/models/configs/transformer-mini.json

This file was deleted.

12 changes: 0 additions & 12 deletions atomgen/models/configs/transformer-small.json

This file was deleted.

12 changes: 0 additions & 12 deletions atomgen/models/configs/transformer-tiny.json

This file was deleted.

16 changes: 0 additions & 16 deletions atomgen/models/configs/unimolplus-mini.json

This file was deleted.

46 changes: 46 additions & 0 deletions atomgen/models/configuration_atomformer.py
@@ -0,0 +1,46 @@
"""Configuration class for Atomformer."""

from typing import Any

from transformers.configuration_utils import PretrainedConfig


class AtomformerConfig(PretrainedConfig): # type: ignore
r"""
Configuration of a :class:`~transform:class:`~transformers.AtomformerModel`.

It is used to instantiate an Atomformer model according to the specified arguments.
"""

model_type = "atomformer"

def __init__(
self,
vocab_size: int = 123,
dim: int = 768,
num_heads: int = 32,
depth: int = 12,
mlp_ratio: int = 1,
k: int = 128,
dropout: float = 0.0,
mask_token_id: int = 0,
pad_token_id: int = 119,
bos_token_id: int = 120,
eos_token_id: int = 121,
cls_token_id: int = 122,
**kwargs: Any,
) -> None:
super().__init__(**kwargs)
self.vocab_size = vocab_size
self.dim = dim
self.num_heads = num_heads
self.depth = depth
self.mlp_ratio = mlp_ratio
self.k = k

self.dropout = dropout
self.mask_token_id = mask_token_id
self.pad_token_id = pad_token_id
self.bos_token_id = bos_token_id
self.eos_token_id = eos_token_id
self.cls_token_id = cls_token_id
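
For reference, a minimal usage sketch of this config class (assuming `atomgen` and `transformers` are installed): build a small configuration mirroring the values in the JSON hunks above, then round-trip it through the standard `PretrainedConfig` save/load helpers.

```python
from atomgen.models.configuration_atomformer import AtomformerConfig

# Mirrors the small config above (dim=128, num_heads=4, depth=2, mlp_ratio=4).
tiny = AtomformerConfig(dim=128, num_heads=4, depth=2, mlp_ratio=4)
print(tiny.model_type, tiny.vocab_size)  # "atomformer", 123 by default

tiny.save_pretrained("atomformer-tiny")                  # writes config.json
reloaded = AtomformerConfig.from_pretrained("atomformer-tiny")
assert reloaded.dim == 128 and reloaded.depth == 2
```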