Skip to content

Commit

Permalink
Return GET /search as OPTIMADE or not
Browse files Browse the repository at this point in the history
Add possibility to return responses from `GET /search` as an OPTIMADE
entry-listing response or as the "standard" gateway query response.

In doing this, some things have been optimized.
Mainly the logic surrounding retrieving and naming databases in the
`POST /search` endpoint.
In order to return a query response as a valid OPTIMADE response, a
method has been added to the `QueryResource` model, which works
similarly to `GET /gateways/<id>/structures`, but working from the basis
of the finished query.
It updates the entry `id`s by prepending the `provider/database/` name,
making the `id`s unique.

Extra safety has been added to the creation of gateway resources, as the
`resource_factory()` now expects a pre-treating `GatewayCreate` entity,
where there are no "unknown" database `id`s in the `database_ids`
attribute. Unknown meaning that all `database_ids` must be represented
in the `databases` attribute.
  • Loading branch information
CasperWA committed Aug 23, 2021
1 parent e4b153b commit 125157d
Show file tree
Hide file tree
Showing 10 changed files with 281 additions and 48 deletions.
4 changes: 3 additions & 1 deletion optimade_gateway/models/gateways.py
Original file line number Diff line number Diff line change
Expand Up @@ -140,7 +140,9 @@ class GatewayCreate(EntryResourceCreate, GatewayResourceAttributes):

@root_validator
def specify_databases(cls, values: dict) -> dict:
"""Either `database_ids` or `databases` must be non-empty"""
"""Either `database_ids` or `databases` must be non-empty.
Both together is also fine.
"""
if not any(values.get(field) for field in ("database_ids", "databases")):
raise ValueError("Either 'database_ids' or 'databases' MUST be specified")
return values
92 changes: 92 additions & 0 deletions optimade_gateway/models/queries.py
Original file line number Diff line number Diff line change
@@ -1,11 +1,14 @@
"""Pydantic models/schemas for the Queries resource"""
from enum import Enum
from typing import Any, Dict, List, Optional, Union
import urllib.parse
import warnings

from optimade.models import (
EntryResource,
EntryResourceAttributes,
EntryResponseMany,
ErrorResponse,
OptimadeError,
ReferenceResource,
ReferenceResponseMany,
Expand All @@ -19,6 +22,7 @@
from optimade.models.utils import StrictField
from optimade.server.query_params import EntryListingQueryParams
from pydantic import BaseModel, EmailStr, Field, validator
from starlette.datastructures import URL as StarletteURL

from optimade_gateway.models.resources import EntryResourceCreate
from optimade_gateway.warnings import SortNotSupported
Expand Down Expand Up @@ -210,6 +214,94 @@ class QueryResource(EntryResource):
)
attributes: QueryResourceAttributes

async def response_as_optimade(
self,
url: Optional[
Union[urllib.parse.ParseResult, urllib.parse.SplitResult, StarletteURL, str]
] = None,
) -> Union[EntryResponseMany, ErrorResponse]:
"""Return `attributes.response` as a valid OPTIMADE entry listing response.
Note, this method disregards the state of the query and will simply return the query results
as they currently are (if there are any at all).
Parameters:
url: Optionally, update the `meta.query.representation` value with this.
Returns:
A valid OPTIMADE entry-listing response according to the
[OPTIMADE specification](https://github.com/Materials-Consortia/OPTIMADE/blob/master/optimade.rst#entry-listing-endpoints)
or an error response, if errors were returned or occurred during the query.
"""
from copy import deepcopy
from optimade.server.routers.utils import meta_values

async def _update_id(
entry_: Union[EntryResource, Dict[str, Any]], database_provider_: str
) -> Union[EntryResource, Dict[str, Any]]:
"""Internal utility function to prepend the entries' `id` with `provider/database/`."""
if isinstance(entry_, dict):
_entry = deepcopy(entry_)
_entry["id"] = f"{database_provider_}/{entry_['id']}"
else:
_entry = entry_.copy(deep=True)
_entry.id = f"{database_provider_}/{entry_.id}"
return _entry

if not self.attributes.response:
# The query as not yet been initiated
return ErrorResponse(
errors=[
{
"detail": (
"Can not return as a valid OPTIMADE response as the query has not yet "
"been initialized."
),
"id": "OPTIMADE_GATEWAY_QUERY_NOT_INITIALIZED",
}
],
meta=meta_values(
url=url or f"/queries/{self.id}?",
data_returned=0,
data_available=0,
more_data_available=False,
),
)

meta_ = self.attributes.response.meta
if url:
meta_ = meta_.dict(exclude_unset=True)
for repeated_key in (
"query",
"api_version",
"time_stamp",
"provider",
"implementation",
):
meta_.pop(repeated_key, None)
meta_ = meta_values(url=url, **meta_)

# Error response
if self.attributes.response.errors:
return ErrorResponse(
errors=self.attributes.response.errors,
meta=meta_,
)

# Data response
results = []
for database_provider, entries in self.attributes.response.data.items():
results.extend(
[await _update_id(entry, database_provider) for entry in entries]
)

return self.attributes.endpoint.get_response_model()(
data=results,
meta=meta_,
links=self.attributes.response.links,
)


class QueryCreate(EntryResourceCreate, QueryResourceAttributes):
"""Model for creating new Query resources in the MongoDB"""
Expand Down
15 changes: 15 additions & 0 deletions optimade_gateway/queries/params.py
Original file line number Diff line number Diff line change
Expand Up @@ -35,6 +35,11 @@ class in `optimade´, which defines the standard entry listing endpoint query pa
time, a redirection will still be performed, but to a zero-results page, which can be
refreshed to get the finished query (once it has finished).
as_optimade (bool): Return the response as a standard OPTIMADE entry listing endpoint
response. Otherwise, the response will be based on the
[`QueriesResponseSingle`][optimade_gateway.models.responses.QueriesResponseSingle]
model.
"""

def __init__(
Expand Down Expand Up @@ -72,8 +77,18 @@ def __init__(
"which can be refreshed to get the finished query (once it has finished)."
),
),
as_optimade: bool = Query(
False,
description=(
"Return the response as a standard OPTIMADE entry listing endpoint response. "
"Otherwise, the response will be based on the "
"[`QueriesResponseSingle`][optimade_gateway.models.responses.QueriesResponseSingle]"
" model."
),
)
) -> None:
self.database_ids = database_ids
self.optimade_urls = optimade_urls
self.endpoint = endpoint
self.timeout = timeout
self.as_optimade = as_optimade
30 changes: 29 additions & 1 deletion optimade_gateway/queries/perform.py
Original file line number Diff line number Diff line change
Expand Up @@ -288,6 +288,34 @@ def db_find(
try:
response = ErrorResponse(**response)
except ValidationError as exc:
# If it's an error and `meta` is missing, it is not a valid OPTIMADE response,
# but this happens a lot, and is therefore worth having an edge-case for.
if "errors" in response:
errors = list(response["errors"])
errors.append(
{
"detail": (
f"Could not pass response from {url} as either a "
f"{response_model.__name__!r} or 'ErrorResponse'. "
f"ValidationError: {exc}"
),
"id": "OPTIMADE_GATEWAY_DB_FINDS_MANY_VALIDATIONERRORS",
}
)
return (
ErrorResponse(
errors=errors,
meta={
"query": {
"representation": f"/{endpoint.strip('/')}?{query_params}"
},
"api_version": __api_version__,
"more_data_available": False,
},
),
get_resource_attribute(database, "id"),
)

return (
ErrorResponse(
errors=[
Expand All @@ -297,7 +325,7 @@ def db_find(
f"{response_model.__name__!r} or 'ErrorResponse'. "
f"ValidationError: {exc}"
),
"id": "OPTIMADE_GATEWAY_DB_FIND_MANY_VALIDATIONERROR",
"id": "OPTIMADE_GATEWAY_DB_FINDS_MANY_VALIDATIONERRORS",
}
],
meta={
Expand Down
20 changes: 16 additions & 4 deletions optimade_gateway/queries/process.py
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,7 @@
OptimadeError,
)

from optimade_gateway.common.config import CONFIG
from optimade_gateway.common.utils import get_resource_attribute
from optimade_gateway.models import GatewayResource, QueryResource
from optimade_gateway.queries.utils import update_query
Expand Down Expand Up @@ -75,10 +76,21 @@ async def process_db_response(
meta_error = error.meta.dict()
meta_error.update(
{
"optimade_gateway": {
"gateway": gateway,
"source_database_id": database_id,
}
f"_{CONFIG.provider.prefix}_source_gateway": {
"id": gateway.id,
"type": gateway.type,
"links": {"self": gateway.links.self},
},
f"_{CONFIG.provider.prefix}_source_database": {
"id": database_id,
"type": "links",
"links": {
"self": (
str(gateway.links.self).split("gateways")[0]
+ f"databases/{database_id}"
)
},
},
}
)
error.meta = Meta(**meta_error)
Expand Down
4 changes: 3 additions & 1 deletion optimade_gateway/routers/databases.py
Original file line number Diff line number Diff line change
Expand Up @@ -128,7 +128,9 @@ async def get_database(
) = await DATABASES_COLLECTION.find(params=params)

if fields or include_fields and result is not None:
result = handle_response_fields(result, fields, include_fields)[0]
result = handle_response_fields(result, fields, include_fields)

result = result[0] if data_returned else None

return DatabasesResponseSingle(
links=ToplevelLinks(next=None),
Expand Down
35 changes: 27 additions & 8 deletions optimade_gateway/routers/gateway/structures.py
Original file line number Diff line number Diff line change
Expand Up @@ -86,8 +86,14 @@ async def get_structures(
if isinstance(gateway_response, ErrorResponse):
for error in gateway_response.errors:
if error.status:
response.status_code = int(error.status)
break
for part in error.status.split(" "):
try:
response.status_code = int(part)
break
except ValueError:
pass
if response.status_code and response.status_code >= 300:
break
else:
response.status_code = 500
return gateway_response
Expand Down Expand Up @@ -134,6 +140,7 @@ async def get_single_structure(
Example: `GET /gateways/some_gateway/structures/some_database/some_structure`.
"""
from optimade_gateway.common.config import CONFIG
from optimade_gateway.models import GatewayResource
from optimade_gateway.queries import db_find
from optimade_gateway.routers.utils import get_valid_resource
Expand Down Expand Up @@ -182,10 +189,16 @@ async def get_single_structure(
meta = error.meta.dict()
meta.update(
{
"optimade_gateway": {
"gateway": gateway,
"source_database_id": database.id,
}
f"_{CONFIG.provider.prefix}_source_gateway": {
"id": gateway.id,
"type": gateway.type,
"links": {"self": gateway.links.self},
},
f"_{CONFIG.provider.prefix}_source_database": {
"id": database.id,
"type": database.type,
"links": {"self": database.links.self},
},
}
)
error.meta = Meta(**meta)
Expand Down Expand Up @@ -239,8 +252,14 @@ async def get_single_structure(
if isinstance(gateway_response, ErrorResponse):
for error in errors or gateway_response.errors:
if error.status:
response.status_code = int(error.status)
break
for part in error.status.split(" "):
try:
response.status_code = int(part)
break
except ValueError:
pass
if response.status_code and response.status_code >= 300:
break
else:
response.status_code = 500

Expand Down
10 changes: 8 additions & 2 deletions optimade_gateway/routers/queries.py
Original file line number Diff line number Diff line change
Expand Up @@ -136,8 +136,14 @@ async def get_query(
if query.attributes.response.errors:
for error in query.attributes.response.errors:
if error.status:
response.status_code = int(error.status)
break
for part in error.status.split(" "):
try:
response.status_code = int(part)
break
except ValueError:
pass
if response.status_code and response.status_code >= 300:
break
else:
response.status_code = 500

Expand Down
Loading

0 comments on commit 125157d

Please sign in to comment.