-
-
Notifications
You must be signed in to change notification settings - Fork 227
/
Copy pathutils.py
75 lines (49 loc) · 1.91 KB
/
utils.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
import builtins
import re
from keyword import iskeyword
from typing import List
delimiters = " _-"
def sanitize(value: str) -> str:
"""Removes every character that isn't 0-9, A-Z, a-z, or a known delimiter"""
return re.sub(rf"[^\w{delimiters}]+", "", value)
def split_words(value: str) -> List[str]:
"""Split a string on non-capital letters and known delimiters"""
value = " ".join(re.split("([A-Z]?[a-z]+)", value))
return re.findall(rf"[^{delimiters}]+", value)
def fix_keywords(value: str) -> str:
if iskeyword(value):
return f"{value}_"
return value
RESERVED_WORDS = (set(dir(builtins)) | {"self"}) - {"type", "id"}
def fix_reserved_words(value: str) -> str:
if value in RESERVED_WORDS:
return f"{value}_"
return value
def snake_case(value: str) -> str:
words = split_words(sanitize(value))
value = "_".join(words).lower()
return fix_keywords(value)
def pascal_case(value: str) -> str:
words = split_words(sanitize(value))
capitalized_words = (word.capitalize() if not word.isupper() else word for word in words)
value = "".join(capitalized_words)
return fix_keywords(value)
def kebab_case(value: str) -> str:
words = split_words(sanitize(value))
value = "-".join(words).lower()
return fix_keywords(value)
def remove_string_escapes(value: str) -> str:
return value.replace('"', r"\"")
# This can be changed by config.Config.load_config
FIELD_PREFIX = "field_"
def to_valid_python_identifier(value: str) -> str:
"""
Given a string, attempt to coerce it into a valid Python identifier by stripping out invalid characters and, if
necessary, prepending a prefix.
See:
https://docs.python.org/3/reference/lexical_analysis.html#identifiers
"""
new_value = fix_reserved_words(fix_keywords(sanitize(value)))
if new_value.isidentifier():
return new_value
return f"{FIELD_PREFIX}{new_value}"