Aliases now also work for nested fields; only retrieve the data required for constructing a response from the database. #1304

Open
wants to merge 28 commits into base: main

Commits (28)
b949945
Alow aliases to be nested fields.
JPBergsma Aug 17, 2022
7adbf4a
Added a line to docs to explain how to alias nested fields.
JPBergsma Aug 17, 2022
8c05579
Merge branch 'master' into JPBergsma/allow_nested_aliases
JPBergsma Aug 17, 2022
6c8294b
Merge branch 'master' into JPBergsma/allow_nested_aliases
JPBergsma Aug 27, 2022
0ebc724
Merge branch 'master' into JPBergsma/allow_nested_aliases
JPBergsma Sep 14, 2022
4388c9d
Merge branch 'Materials-Consortia:master' into JPBergsma/allow_nested…
JPBergsma Oct 19, 2022
c29cdbb
Merge branch 'master' into JPBergsma/allow_nested_aliases
JPBergsma Nov 1, 2022
368792a
1. Added support for more versatile aliassing allowing nested fields.…
JPBergsma Nov 11, 2022
38fcde7
Merge branch 'master' into JPBergsma/allow_nested_aliases
JPBergsma Nov 11, 2022
5cec6d6
Added type hint to alias_and_prefix function.
JPBergsma Nov 14, 2022
cbba008
Added missing..
JPBergsma Nov 14, 2022
67f2dea
Fixed bug in elastic search where the requested fields were determine…
JPBergsma Nov 15, 2022
775009d
Use https://github.com/pycqa/flake8 instead of https://gitlab.com/pyc…
JPBergsma Nov 15, 2022
1358b9d
Added pyyaml to install requirements and added python 3.11 classifier.
JPBergsma Nov 16, 2022
bb228ee
Made a small change to the descriptions of the nested dict functions …
JPBergsma Nov 16, 2022
8245884
Removed pyyaml from serverdeps as I placed it already under installre…
JPBergsma Nov 16, 2022
7b2320b
Removed get_value function from entries.py as it was no longer needed…
JPBergsma Nov 16, 2022
d87bc1b
Removed get_value function from entries.py as it was no longer needed…
JPBergsma Nov 16, 2022
6b99822
Simplified set_field_to_none_if_missing_in_dict and moved it out of t…
JPBergsma Nov 16, 2022
841520d
Moved functions related to handling nested dicts to utils.py.
JPBergsma Nov 16, 2022
c22089f
Updated docstring remove_exclude_fields and removed unneccesary brack…
JPBergsma Nov 16, 2022
1146273
solved merge conflict.
JPBergsma Nov 16, 2022
4c46f55
Updateof the explanation of the handling of nested fields
JPBergsma Nov 17, 2022
3a908bc
Merged changes from master.
JPBergsma Nov 30, 2022
1e49fb8
fix bug introduced by merge with master.
JPBergsma Nov 30, 2022
596bb73
Made changes to satisfy mypy.
JPBergsma Nov 30, 2022
703a9df
Added option to automatically set missing but required fields to the …
JPBergsma Nov 30, 2022
f174850
Removed get_non_optional_fields and get_schema as they are no longer …
JPBergsma Nov 30, 2022
1 change: 1 addition & 0 deletions docs/getting_started/setting_up_an_api.md
Expand Up @@ -37,6 +37,7 @@ Instead, if you are storing chemical formulae as an unreduced count per simulati
This would then instead require option 2 above, namely either the addition of auxiliary fields that store the correct (or mappable) OPTIMADE format in the database, or the creation of a secondary database that returns the pre-converted structures.

In the simplest case, the mapper classes can be used to define aliases between fields in the database and the OPTIMADE field name; these can be configured via the [`aliases`][optimade.server.config.ServerConfig.aliases] option as a dictionary mapping stored in a dictionary under the appropriate endpoint name, e.g. `"aliases": {"structures": {"chemical_formula_reduced": "my_chem_form"}}`, or defined as part of a custom mapper class.
If the alias is a nested field (i.e., a field within a dictionary), the field names should be separated by `"."`, for example: `"aliases": { "structures": {"chemical_formula_reduced": "formulae.reduced"}}`.

In either option, you should now be able to insert your data into the corresponding MongoDB (or otherwise) collection.

Expand Down
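To make the new option concrete, a server config snippet along these lines (a sketch following the documentation example above, not taken from a real deployment) would alias the OPTIMADE field chemical_formula_reduced to the nested database field formulae.reduced:

{
  "aliases": {
    "structures": {
      "chemical_formula_reduced": "formulae.reduced"
    }
  }
}
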
13 changes: 13 additions & 0 deletions optimade/models/jsonapi.py
Expand Up @@ -298,6 +298,19 @@ def check_illegal_attributes_fields(cls, values):
)
return values

@root_validator(pre=True)
def set_missing_to_none(cls, values):
if "set_missing_to_none" in values and values.pop("set_missing_to_none"):
for field in cls.schema()["required"]:
if field not in values:
if (
field == "structure_features"
): # It would be nice if there would be a more universal way to handle special cases like this.
values[field] = []
else:
values[field] = None
return values

Comment on lines +301 to +313
Member:

This looks on the right track! I've just played around with something too after spotting something in the pydantic docs about default factories. Would the snippet also solve this issue?

>>> from pydantic import BaseModel, Field
>>> from typing import Optional
>>> class Model(BaseModel):
...     test: Optional[str] = Field(default_factory=lambda: None)
...
>>> Model()
Model(test=None)
>>> Model(test=None)
Model(test=None)
>>> Model(test="value")
Model(test='value')
>>> Model.schema()
{'title': 'Model', 'type': 'object', 'properties': {'test': {'title': 'Test', 'type': 'string'}}}

We can then patch the underlying OptimadeField and StrictField wrappers to default to having a default_factory that returns null in cases where there is no default value for the field to fall back on, and we can do this without modifying the schema or the models.

The only concern is that this functionality might get removed from pydantic:

The default_factory argument is in beta, it has been added to pydantic in v1.5 on a provisional basis. It may change significantly in future releases and its signature or behaviour will not be concrete until v2.

Though it has already lasted a few versions.
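
For illustration, a rough sketch of the wrapper-patching idea described above. This is not the actual StrictField from optimade.models.utils, just a minimal stand-in showing how a None-returning default_factory could be substituted whenever no default value is supplied:

from typing import Any
from pydantic import Field

def StrictField(default: Any = ..., **kwargs: Any) -> Any:
    # If the caller supplied neither a default nor a default_factory,
    # fall back to a factory that returns None, so that missing values
    # deserialize as null instead of failing validation.
    if default is ... and "default_factory" not in kwargs:
        return Field(default_factory=lambda: None, **kwargs)
    return Field(default, **kwargs)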


class Resource(BaseResource):
"""Resource objects appear in a JSON API document to represent resources."""
Expand Down
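For context, a minimal standalone sketch of the pattern implemented by the set_missing_to_none validator added above, using a toy model rather than the actual optimade classes: a transient flag in the input dict triggers None-filling of missing required fields before field validation runs.

from typing import List, Optional
from pydantic import BaseModel, Field, root_validator

class ToyAttributes(BaseModel):
    nsites: Optional[int] = Field(...)
    elements: Optional[List[str]] = Field(...)

    @root_validator(pre=True)
    def set_missing_to_none(cls, values):
        # Pop the transient flag so it never becomes part of the model,
        # then fill in any missing required field with None.
        if values.pop("set_missing_to_none", False):
            for field in cls.schema()["required"]:
                values.setdefault(field, None)
        return values

ToyAttributes(set_missing_to_none=True, nsites=3)  # -> nsites=3, elements=None
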
4 changes: 2 additions & 2 deletions optimade/models/links.py
Expand Up @@ -35,11 +35,11 @@ class Aggregate(Enum):
class LinksResourceAttributes(Attributes):
"""Links endpoint resource object attributes"""

name: str = StrictField(
name: Optional[str] = StrictField(
...,
description="Human-readable name for the OPTIMADE API implementation, e.g., for use in clients to show the name to the end-user.",
)
description: str = StrictField(
description: Optional[str] = StrictField(
...,
description="Human-readable description for the OPTIMADE API implementation, e.g., for use in clients to show a description to the end-user.",
)
Expand Down
8 changes: 1 addition & 7 deletions optimade/models/references.py
@@ -1,7 +1,7 @@
# pylint: disable=line-too-long,no-self-argument
from typing import List, Optional

from pydantic import AnyUrl, BaseModel, validator # pylint: disable=no-name-in-module
from pydantic import AnyUrl, BaseModel # pylint: disable=no-name-in-module

from optimade.models.entries import EntryResource, EntryResourceAttributes
from optimade.models.utils import OptimadeField, SupportLevel
Expand Down Expand Up @@ -260,9 +260,3 @@ class ReferenceResource(EntryResource):
queryable=SupportLevel.MUST,
)
attributes: ReferenceResourceAttributes

@validator("attributes")
def validate_attributes(cls, v):
if not any(prop[1] is not None for prop in v):
raise ValueError("reference object must have at least one field defined")
return v
8 changes: 8 additions & 0 deletions optimade/server/data/test_structures.json
Expand Up @@ -5,6 +5,7 @@
},
"assemblies": null,
"chemsys": "Ac",
"dichtheid": 10.07,
"cartesian_site_positions": [
[
0.17570227444196573,
Expand Down Expand Up @@ -1222,6 +1223,7 @@
"nelements": 5,
"nsites": 24,
"pretty_formula": "Ag2C6ClH12N3",
"fancy_formulas": {"hill": "C6H12Ag2ClN3"},
"species": [
{
"chemical_symbols": [
Expand Down Expand Up @@ -1475,6 +1477,9 @@
"nelements": 5,
"nsites": 25,
"pretty_formula": "Ag2C2H2N6O13",
"fancy_formulas" : {
"hill": "C2H2Ag2N6O13"
},
"species": [
{
"chemical_symbols": [
Expand Down Expand Up @@ -1723,6 +1728,7 @@
"nelements": 7,
"nsites": 23,
"pretty_formula": "Ag2C2ClH8N5O3S2",
"fancy_formulas": {"hill": "C2H8Ag2ClN5O3S2"},
"species": [
{
"chemical_symbols": [
Expand Down Expand Up @@ -2467,6 +2473,7 @@
"nelements": 8,
"nsites": 74,
"pretty_formula": "AgB10C15Cl2H40NO3P2",
"fancy_formulas": {"hill": "C15H40AgB10Cl2NO3P2"},
"species": [
{
"chemical_symbols": [
Expand Down Expand Up @@ -2821,6 +2828,7 @@
"nelements": 7,
"nsites": 29,
"pretty_formula": "AgC3ClH14N6OS3",
"fancy_formulas":{"hill": "C3H14AgClN6OS3"},
"species": [
{
"chemical_symbols": [
Expand Down
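The new test-data fields above ("dichtheid", Dutch for "density", and the nested "fancy_formulas.hill") are presumably exercised through matching alias entries in the test server config. A hypothetical mapping (the actual test config is not part of this diff) could look like:

{
  "aliases": {
    "structures": {
      "chemical_formula_hill": "fancy_formulas.hill",
      "_exmpl_density": "dichtheid"
    }
  }
}
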
4 changes: 1 addition & 3 deletions optimade/server/entry_collections/elasticsearch.py
Expand Up @@ -168,9 +168,7 @@ def _run_db_query(
page_offset = criteria.get("skip", 0)
limit = criteria.get("limit", CONFIG.page_limit)

all_aliased_fields = [
self.resource_mapper.get_backend_field(field) for field in self.all_fields
]
all_aliased_fields = [field for field in criteria.get("projection", [])]
search = search.source(includes=all_aliased_fields)

elastic_sort = [
Expand Down
64 changes: 37 additions & 27 deletions optimade/server/entry_collections/entry_collections.py
@@ -1,6 +1,7 @@
import re
import warnings
from abc import ABC, abstractmethod
from functools import lru_cache
from typing import Any, Dict, Iterable, List, Set, Tuple, Type, Union

from lark import Transformer
Expand All @@ -11,6 +12,7 @@
from optimade.server.config import CONFIG, SupportedBackend
from optimade.server.mappers import BaseResourceMapper
from optimade.server.query_params import EntryListingQueryParams, SingleEntryQueryParams
from optimade.utils import set_field_to_none_if_missing_in_dict
from optimade.warnings import (
FieldValueNotRecognized,
QueryParamNotUsed,
Expand Down Expand Up @@ -121,13 +123,7 @@ def count(self, **kwargs: Any) -> int:

def find(
self, params: Union[EntryListingQueryParams, SingleEntryQueryParams]
) -> Tuple[
Union[List[EntryResource], EntryResource],
int,
bool,
Set[str],
Set[str],
]:
) -> Tuple[Union[List[EntryResource], EntryResource], int, bool, Set[str]]:
"""
Fetches results and indicates if more data is available.

Expand All @@ -146,23 +142,49 @@ def find(
criteria = self.handle_query_params(params)
single_entry = isinstance(params, SingleEntryQueryParams)
response_fields = criteria.pop("fields")
response_fields_set = criteria.pop("response_fields_set", False)

raw_results, data_returned, more_data_available = self._run_db_query(
criteria, single_entry
)

exclude_fields = self.all_fields - response_fields

results: List = [self.resource_mapper.map_back(doc) for doc in raw_results]

self.check_and_add_missing_fields(results, response_fields, response_fields_set)

if results:
results = self.resource_mapper.deserialize(results)

if single_entry:
raw_results = raw_results[0] if raw_results else None # type: ignore[assignment]
results = results[0] if results else None # type: ignore[assignment]

if data_returned > 1:
raise NotFound(
detail=f"Instead of a single entry, {data_returned} entries were found",
)

exclude_fields = self.all_fields - response_fields
return results, data_returned, more_data_available, exclude_fields

def check_and_add_missing_fields(
self, results: List[dict], response_fields: set, response_fields_set: bool
):
"""Checks whether the response_fields and mandatory fields are present.
If they are not present the values are set to None, so the deserialization works correctly.
It also checks whether all fields in the response have been defined either in the model or in the config file.
If not it raises an appropriate error or warning."""
include_fields = (
response_fields - self.resource_mapper.TOP_LEVEL_NON_ATTRIBUTES_FIELDS
)
# Include missing fields
for result in results:
for field in include_fields:
set_field_to_none_if_missing_in_dict(result["attributes"], field)
Comment on lines +181 to +183
Member:

This is going to incur a significant performance overhead, but I guess you want to do it so that you don't have to pull e.g., entire trajectories from the database each time, yet you still want to deserialize the JSON into your classes? I think I would suggest we instead have a per-collection deserialization flag, as presumably you only want to deserialize trajectories once (on database insertion) anyway. Does that make sense?

If you want to retain this approach, it might be cleaner to do it at the pydantic level, e.g., a root_validator that explicitly sets all missing fields to None (see also https://pydantic-docs.helpmanual.io/usage/models/#creating-models-without-validation as an option).
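
The "creating models without validation" link above refers to pydantic v1's construct(), which builds a model instance without running any validators. A minimal illustrative sketch (not code from this PR) of how already-validated database documents could skip re-validation:

from optimade.models import StructureResource

# construct() sets the fields directly from pre-validated data and
# bypasses all validators, including any None-filling root_validator.
mapped_document = {"id": "example-1", "type": "structures", "attributes": {"nsites": 2}}
resource = StructureResource.construct(**mapped_document)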

Contributor Author:

I do not think this is particularly heavy compared to all the other things we do in the code.
It is what we previously did in handle_response_fields; I only moved it here so that it happens before deserialization, and added code to handle nested fields.

For biomolecular data, a structure can easily have 10,000 atoms, so retrieving them from the database and putting them in the model would take some time. This way we can avoid that if the species_at_sites and cartesian_site_positions are not in the response_fields. (I also made a patch in the code for Barcelona that allowed them to specify the default response fields, so they can choose to not have these fields in the response by default.)

I did not want to make the change even bigger by bypassing the rest of the validator (as in your second suggestion).
But from a performance viewpoint, bypassing the validation would be good.
Do you want me to add this to this PR or to a future PR?

I tried the root validator idea, but it seems I already get an error before the root_validator is executed, so I do not think this solution will work.

Member:

Hmmm, fair enough, just looks a bit scarier as a double for loop alongside the recursive descent into dictionaries to get the nested aliases. It's quite hard to reason about this, so I might set up a separate repo for measuring performance in the extreme limits (1 structure of 10000 atoms vs 10000 structures of a few atoms -- i.e., what we have now, ignoring pagination of course).

I tried the root validator idea, but it seems I already get an error before the root_validator is executed, so I do not think this solution will work.

Did you use @root_validator(pre=True) to make sure it gets run before anything else? Perhaps bypassing the validation altogether can wait for another PR, as you suggest, but I'd like to make the performance tests first at least (doesn't necessarily hold up this PR but it might hold up the next release).

Contributor Author:

I just noticed I made a mistake in my test script.
So it may be possible to do this with a root_validator after all.

Contributor Author (JPBergsma, Dec 1, 2022):

I have added a root_validator to the attributes class that, if a flag is set, checks whether all required fields are present and, if not, adds them and sets them to None.

I'll try to move the handling of the other include fields back to where it happened originally, so the code changes less.


if response_fields_set:
for result in results:
result["attributes"]["set_missing_to_none"] = True

bad_optimade_fields = set()
bad_provider_fields = set()
Expand All @@ -189,19 +211,6 @@ def find(
detail=f"Unrecognised OPTIMADE field(s) in requested `response_fields`: {bad_optimade_fields}."
)

if raw_results is not None:
results = self.resource_mapper.deserialize(raw_results)
else:
results = None

return (
results,
data_returned,
more_data_available,
exclude_fields,
include_fields,
)

@abstractmethod
def _run_db_query(
self, criteria: Dict[str, Any], single_entry: bool = False
Expand Down Expand Up @@ -244,6 +253,7 @@ def all_fields(self) -> Set[str]:

return self._all_fields

@lru_cache(maxsize=4)
def get_attribute_fields(self) -> Set[str]:
"""Get the set of attribute fields

Expand Down Expand Up @@ -327,16 +337,16 @@ def handle_query_params(
cursor_kwargs["limit"] = CONFIG.page_limit

# response_fields
cursor_kwargs["projection"] = {
f"{self.resource_mapper.get_backend_field(f)}": True
for f in self.all_fields
}

if getattr(params, "response_fields", False):
cursor_kwargs["response_fields_set"] = True
response_fields = set(params.response_fields.split(","))
response_fields |= self.resource_mapper.get_required_fields()
else:
response_fields = self.all_fields.copy()
cursor_kwargs["projection"] = {
f"{self.resource_mapper.get_backend_field(f)}": True
for f in response_fields
}

cursor_kwargs["fields"] = response_fields

Expand Down
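To illustrate the projection handling in handle_query_params above, a simplified sketch (hypothetical names, not the PR's exact code) of how requested response_fields are turned into a backend projection once aliases may point at nested fields:

# Requested OPTIMADE fields and their (possibly nested) backend aliases.
response_fields = {"chemical_formula_reduced", "nsites"}
aliases = {"chemical_formula_reduced": "formulae.reduced"}  # "."-separated nested field

projection = {aliases.get(field, field): True for field in response_fields}
# -> {"formulae.reduced": True, "nsites": True}
# MongoDB accepts dotted keys in projections, so only the required
# sub-field of a nested document is fetched from the database.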