forked from openapi-generators/openapi-python-client
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathutils.py
More file actions
123 lines (86 loc) · 3.86 KB
/
utils.py
File metadata and controls
123 lines (86 loc) · 3.86 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
from __future__ import annotations
import builtins
import re
from email.message import Message
from keyword import iskeyword
from typing import Any
from .config import Config
DELIMITERS = r"\. _-"
class PythonIdentifier(str):
"""A snake_case string which has been validated / transformed into a valid identifier for Python"""
def __new__(cls, value: str, prefix: str, skip_snake_case: bool = False) -> PythonIdentifier:
new_value = sanitize(value)
if not skip_snake_case:
new_value = snake_case(new_value)
new_value = fix_reserved_words(new_value)
if not new_value.isidentifier() or value.startswith("_"):
new_value = f"{prefix}{new_value}"
return str.__new__(cls, new_value)
def __deepcopy__(self, _: Any) -> PythonIdentifier:
return self
class ClassName(str):
"""A PascalCase string which has been validated / transformed into a valid class name for Python"""
def __new__(cls, value: str, prefix: str) -> ClassName:
new_value = fix_reserved_words(pascal_case(sanitize(value)))
if not new_value.isidentifier():
value = f"{prefix}{new_value}"
new_value = fix_reserved_words(pascal_case(sanitize(value)))
return str.__new__(cls, new_value)
def __deepcopy__(self, _: Any) -> ClassName:
return self
def sanitize(value: str) -> str:
"""Removes every character that isn't 0-9, A-Z, a-z, or a known delimiter"""
return re.sub(rf"[^\w{DELIMITERS}]+", "", value)
def split_words(value: str) -> list[str]:
"""Split a string on words and known delimiters"""
# We can't guess words if there is no capital letter
if any(c.isupper() for c in value):
value = " ".join(re.split("([A-Z]?[a-z]+)", value))
return re.findall(rf"[^{DELIMITERS}]+", value)
RESERVED_WORDS = (set(dir(builtins)) | {"self", "true", "false", "datetime"}) - {
"type",
"id",
}
def fix_reserved_words(value: str) -> str:
"""
Using reserved Python words as identifiers in generated code causes problems, so this function renames them.
Args:
value: The identifier to-be that should be renamed if it's a reserved word.
Returns:
`value` suffixed with `_` if it was a reserved word.
"""
if value in RESERVED_WORDS or iskeyword(value):
return f"{value}_"
return value
def snake_case(value: str) -> str:
"""Converts to snake_case"""
words = split_words(sanitize(value))
return "_".join(words).lower()
def pascal_case(value: str) -> str:
"""Converts to PascalCase"""
words = split_words(sanitize(value))
capitalized_words = (word.capitalize() if not word.isupper() else word for word in words)
return "".join(capitalized_words)
def kebab_case(value: str) -> str:
"""Converts to kebab-case"""
words = split_words(sanitize(value))
return "-".join(words).lower()
def remove_string_escapes(value: str) -> str:
"""Used when parsing string-literal defaults to prevent escaping the string to write arbitrary Python
**REMOVING OR CHANGING THE USAGE OF THIS FUNCTION HAS SECURITY IMPLICATIONS**
See Also:
- https://github.com/openapi-generators/openapi-python-client/security/advisories/GHSA-9x4c-63pf-525f
"""
return value.replace('"', r"\"")
def get_content_type(content_type: str, config: Config) -> str | None:
"""
Given a string representing a content type with optional parameters, returns the content type only
"""
content_type = config.content_type_overrides.get(content_type, content_type)
message = Message()
message.add_header("Content-Type", content_type)
parsed_content_type = message.get_content_type()
if not content_type.startswith(parsed_content_type):
# Always defaults to `text/plain` if it's not recognized. We want to return an error, not default.
return None
return parsed_content_type