python-client-generator/python_client_generator/generate_models.py at 95dd0e45f87b3a49592ce6f59965a1465eea57c6 · sennder/python-client-generator · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
import os
import re

from pathlib import Path
from typing import Any, Dict, List

import chevron

from .utils import resolve_type, sanitize_name, serialize_to_python_code


dir_path = Path(os.path.dirname(os.path.realpath(__file__)))
templates_path = dir_path / "templates"


def resolve_field_args(property: Dict[str, Any]) -> Dict[str, Any]:
    """
    Map OpenAPI properties to Pydantic Field function args
    """
    args = {}
    if "maxLength" in property:
        args["max_length"] = property["maxLength"]
    if "minLength" in property:
        args["min_length"] = property["minLength"]
    # TODO: decide later if we want the description field or a comment above the line
    # if "description" in property:
    #     args_dict["description"] = property["description"]
    if "default" in property:
        args["default"] = property["default"]

    return args


def serialize_args_dict(args_dict: Dict[str, Any]) -> str:
    args_list = [f"{k}={serialize_to_python_code(v)}" for k, v in args_dict.items()]
    return ", ".join(args_list)


def _get_schema_references(schema: Dict[str, Any]) -> List[str]:
    union_keys = list(set(["allOf", "anyOf", "oneOf"]) & set(schema.keys()))
    if union_keys:
        arr = []
        for p_sub_schema in schema[union_keys[0]]:
            arr += _get_schema_references(p_sub_schema)
        return arr
    elif "type" not in schema:
        return []
    elif schema["type"] == "array":
        return _get_schema_references(schema["items"])
    elif schema["type"] == "object" or (schema["type"] == "string" and "enum" in schema):
        # As some nested enums may not have a title, we need to check for it.
        # This is observed to happen inside the properties of a schema that uses an enum with referencing to another enum schema (raw values instead)  # noqa E501
        # Example:
        # "properties": { # properties of an object schema (type is object)
        #     "status": {
        #         "type": "string",
        #         "enum": [
        #             "active",
        #             "inactive"
        #         ]
        #     }
        # }
        # In this case, the enum values are not defined in a schema with a title, so we need to check for it.  # noqa E501
        # For the case where the enum values are defined in a schema with a title, the title will be used.  # noqa E501
        # Example:
        # "schemas": {
        #     ...,  # other schemas
        #     "Status": {
        #         "title": "Status",
        #         "type": "string",
        #         "enum": [
        #             "active",
        #             "inactive"
        #         ]
        #     }
        # }
        # And then it will be referenced in the properties like this:
        # "properties": { # properties of an object schema (type is object)
        #     "status": {
        #         "$ref": "#/components/schemas/Status"
        #     }
        # }

        return [schema.get("title", "")]
    else:
        return []


def get_references(model: Dict[str, Any]) -> List[str]:
    """
    Get a list of dependencies for a model

    These come from either their properties or unionized referencing.
    """
    refs = []
    union_keys = list(set(["allOf", "anyOf", "oneOf"]) & set(model.keys()))
    if union_keys:
        return _get_schema_references(model)
    elif "properties" in model:
        # Must have properties
        for p_schema in model["properties"].values():
            refs += _get_schema_references(p_schema)

    return [sanitize_name(r) for r in refs]


def get_fields(schema: Dict[str, Any]) -> List[Dict[str, Any]]:
    union_keys = list(set(["allOf", "anyOf", "oneOf"]) & set(schema.keys()))
    if union_keys:
        # Handle union cases by creating a __root__ defined model
        return [{"name": "__root__", "type": resolve_type(schema)}]
    elif "properties" in schema:
        return [
            {
                "name": k,
                "type": resolve_type(v, use_literals=True),
                "optional": "required" not in schema or k not in schema["required"],
                "field_args": serialize_args_dict(resolve_field_args(v)),
            }
            for k, v in schema["properties"].items()
        ]
    else:
        return []


def _strip_nonexistant_refs(objects: List[Dict[str, Any]]) -> None:
    """
    Remove any references to names not in the objects list
    """
    names = [o["name"] for o in objects]
    for o in objects:
        o["refs"] = [ref for ref in o["refs"] if ref in names]


def _get_ref_index(objects: List[Dict[str, Any]], name: str) -> int:
    return next(i for i, o in enumerate(objects) if o["name"] == name)


def _object_has_binary_properties(object: Dict[str, Any]) -> bool:
    """
    Determine if an object has some properties which are binary
    """
    for p in object.get("properties", {}).values():
        if p.get("type") == "string" and p.get("format") == "binary":
            return True
    return False


def _sort_models(objects: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
    """
    Resolve object dependencies by walking through the objects list
    and moving any dependencies which are further along in the list
    ahead of us.
    """
    i = 0
    while i < len(objects):
        sorted = False
        for ref in objects[i]["refs"]:
            ref_index = _get_ref_index(objects, ref)
            if ref_index > i:
                objects.insert(i, objects.pop(ref_index))
                sorted = True

        if not sorted:
            i += 1  # Ensure shifted references reprocessed

    return objects


def get_models(schemas: Dict[str, Any]) -> List[Dict[str, Any]]:
    objects = (v for v in schemas.values() if "type" not in v or v["type"] == "object")

    models = []
    for o in objects:
        # Skip models with "binary" properties as these are related to file uploads
        # and we handle them with function arguments on the API
        if _object_has_binary_properties(o):
            continue

        p: Dict[str, Any] = {}
        p["refs"] = get_references(o)
        p["name"] = sanitize_name(o["title"])
        p["fields"] = get_fields(o)
        models.append(p)

    _strip_nonexistant_refs(models)
    _sort_models(models)
    return models


def _enum_val_to_name(value: Any) -> str:
    """
    Generate name for each enumeration value.
    """
    if isinstance(value, (int, float)):
        return "NUMBER_" + str(float(value)).replace(".", "_DOT_")
    elif isinstance(value, (str)):
        # TODO: use proper regex replace to insure we don't create variable names non
        # compliant with Python syntax
        char_list = [" ", "-", ".", ",", "&"]
        for c in char_list:
            value = value.replace(c, "_")
        return "".join(re.findall(r"[A-Za-z0-9]+[A-Za-z0-9_]*", value.upper()))
    else:
        raise Exception(f"Unsupported enum value type: {value.__class__}")


def get_enums(schemas: Dict[str, Any]) -> List[Dict[str, Any]]:
    objects = {k: v for k, v in schemas.items() if "enum" in v}

    enums = []
    for _, o in objects.items():
        p: Dict[str, Any] = {}
        p["name"] = sanitize_name(o["title"])
        p["type"] = resolve_type(o)
        p["fields"] = [
            {
                "name": _enum_val_to_name(v),
                "value": serialize_to_python_code(v),
            }
            for v in o["enum"]
        ]
        enums.append(p)

    return enums


def generate_models(swagger: Dict[str, Any], out_file: Path) -> None:
    """
    Generate enums and Pydantic models from the dereferenced OpenAPI file.
    """
    schemas = swagger["components"]["schemas"]

    models = get_models(schemas)
    enums = get_enums(schemas)

    with open(templates_path / "models.py.mustache", "r") as f:
        models_str = chevron.render(f, {"enums": enums, "models": models})

    with open(out_file, "w+") as f:
        f.write(models_str)