Skip to content

Commit 54d8603

Browse files
committed
Escape url parameters in sqlalchemy connection strings
1 parent cd614ff commit 54d8603

File tree

5 files changed

+262
-29
lines changed

5 files changed

+262
-29
lines changed

README.md

Lines changed: 15 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -72,8 +72,13 @@ NOTE: `password` and `schema` are optional
7272
from sqlalchemy import create_engine
7373
from sqlalchemy.schema import Table, MetaData
7474
from sqlalchemy.sql.expression import select, text
75+
from trino.sqlalchemy import URL
7576

76-
engine = create_engine('trino://user@localhost:8080/system')
77+
engine = create_engine(URL(
78+
host="localhost",
79+
port=8080,
80+
catalog="system"
81+
))
7782
connection = engine.connect()
7883

7984
rows = connection.execute(text("SELECT * FROM runtime.nodes")).fetchall()
@@ -93,6 +98,7 @@ Attributes can also be passed in the connection string.
9398

9499
```python
95100
from sqlalchemy import create_engine
101+
from trino.sqlalchemy import URL
96102

97103
engine = create_engine(
98104
'trino://user@localhost:8080/system',
@@ -110,6 +116,14 @@ engine = create_engine(
110116
'&client_tags=["tag1", "tag2"]'
111117
'&experimental_python_types=true',
112118
)
119+
120+
# or using the URL factory method
121+
engine = create_engine(URL(
122+
host="localhost",
123+
port=8080,
124+
client_tags=["tag1", "tag2"],
125+
experimental_python_types=True
126+
))
113127
```
114128

115129
## Authentication mechanisms

tests/unit/sqlalchemy/test_dialect.py

Lines changed: 135 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -9,27 +9,43 @@
99
from trino.dbapi import Connection
1010
from trino.sqlalchemy.dialect import CertificateAuthentication, JWTAuthentication, TrinoDialect
1111
from trino.transaction import IsolationLevel
12+
from trino.sqlalchemy import URL as trino_url
1213

1314

1415
class TestTrinoDialect:
1516
def setup(self):
1617
self.dialect = TrinoDialect()
1718

1819
@pytest.mark.parametrize(
19-
"url, expected_args, expected_kwargs",
20+
"url, generated_url, expected_args, expected_kwargs",
2021
[
2122
(
22-
make_url("trino://user@localhost"),
23+
make_url(trino_url(
24+
user="user",
25+
host="localhost",
26+
)),
27+
'trino://user@localhost:8080?source=trino-sqlalchemy',
2328
list(),
24-
dict(host="localhost", catalog="system", user="user", source="trino-sqlalchemy"),
29+
dict(host="localhost", catalog="system", user="user", port=8080, source="trino-sqlalchemy"),
2530
),
2631
(
27-
make_url("trino://user@localhost:8080"),
32+
make_url(trino_url(
33+
user="user",
34+
host="localhost",
35+
port=443,
36+
)),
37+
'trino://user@localhost:443?source=trino-sqlalchemy',
2838
list(),
29-
dict(host="localhost", port=8080, catalog="system", user="user", source="trino-sqlalchemy"),
39+
dict(host="localhost", port=443, catalog="system", user="user", source="trino-sqlalchemy"),
3040
),
3141
(
32-
make_url("trino://user:pass@localhost:8080?source=trino-rulez"),
42+
make_url(trino_url(
43+
user="user",
44+
password="pass",
45+
host="localhost",
46+
source="trino-rulez",
47+
)),
48+
'trino://user:***@localhost:8080?source=trino-rulez',
3349
list(),
3450
dict(
3551
host="localhost",
@@ -42,13 +58,64 @@ def setup(self):
4258
),
4359
),
4460
(
45-
make_url(
46-
'trino://user@localhost:8080?'
47-
'session_properties={"query_max_run_time": "1d"}'
48-
'&http_headers={"trino": 1}'
49-
'&extra_credential=[("a", "b"), ("c", "d")]'
50-
'&client_tags=[1, "sql"]'
51-
'&experimental_python_types=true'),
61+
make_url(trino_url(
62+
user="user",
63+
host="localhost",
64+
cert="/my/path/to/cert",
65+
key="afdlsdfk%4#'",
66+
)),
67+
'trino://user@localhost:8080'
68+
'?cert=%2Fmy%2Fpath%2Fto%2Fcert'
69+
'&key=afdlsdfk%254%23%27'
70+
'&source=trino-sqlalchemy',
71+
list(),
72+
dict(
73+
host="localhost",
74+
port=8080,
75+
catalog="system",
76+
user="user",
77+
auth=CertificateAuthentication("/my/path/to/cert", "afdlsdfk%4#'"),
78+
http_scheme="https",
79+
source="trino-sqlalchemy"
80+
),
81+
),
82+
(
83+
make_url(trino_url(
84+
user="user",
85+
host="localhost",
86+
access_token="afdlsdfk%4#'",
87+
)),
88+
'trino://user@localhost:8080'
89+
'?access_token=afdlsdfk%254%23%27'
90+
'&source=trino-sqlalchemy',
91+
list(),
92+
dict(
93+
host="localhost",
94+
port=8080,
95+
catalog="system",
96+
user="user",
97+
auth=JWTAuthentication("afdlsdfk%4#'"),
98+
http_scheme="https",
99+
source="trino-sqlalchemy"
100+
),
101+
),
102+
(
103+
make_url(trino_url(
104+
user="user",
105+
host="localhost",
106+
session_properties={"query_max_run_time": "1d"},
107+
http_headers={"trino": 1},
108+
extra_credential=[("a", "b"), ("c", "d")],
109+
client_tags=["1", "sql"],
110+
experimental_python_types=True,
111+
)),
112+
'trino://user@localhost:8080'
113+
'?client_tags=%5B%221%22%2C+%22sql%22%5D'
114+
'&experimental_python_types=true'
115+
'&extra_credential=%5B%28%27a%27%2C+%27b%27%29%2C+%28%27c%27%2C+%27d%27%29%5D'
116+
'&http_headers=%7B%22trino%22%3A+1%7D'
117+
'&session_properties=%7B%22query_max_run_time%22%3A+%221d%22%7D'
118+
'&source=trino-sqlalchemy',
52119
list(),
53120
dict(
54121
host="localhost",
@@ -59,13 +126,66 @@ def setup(self):
59126
session_properties={"query_max_run_time": "1d"},
60127
http_headers={"trino": 1},
61128
extra_credential=[("a", "b"), ("c", "d")],
62-
client_tags=[1, "sql"],
129+
client_tags=["1", "sql"],
63130
experimental_python_types=True,
64131
),
65132
),
133+
# url encoding
134+
(
135+
make_url(trino_url(
136+
user="user@test.org/my_role",
137+
password="pass /*&",
138+
host="localhost",
139+
session_properties={"query_max_run_time": "1d"},
140+
http_headers={"trino": 1},
141+
extra_credential=[
142+
("user1@test.org/my_role", "user2@test.org/my_role"),
143+
("user3@test.org/my_role", "user36@test.org/my_role")],
144+
experimental_python_types=True,
145+
client_tags=["1 @& /\"", "sql"],
146+
verify=False,
147+
)),
148+
'trino://user%40test.org%2Fmy_role:***@localhost:8080'
149+
'?client_tags=%5B%221+%40%26+%2F%5C%22%22%2C+%22sql%22%5D'
150+
'&experimental_python_types=true'
151+
'&extra_credential=%5B%28%27user1%40test.org%2Fmy_role%27%2C'
152+
'+%27user2%40test.org%2Fmy_role%27%29%2C'
153+
'+%28%27user3%40test.org%2Fmy_role%27%2C'
154+
'+%27user36%40test.org%2Fmy_role%27%29%5D'
155+
'&http_headers=%7B%22trino%22%3A+1%7D'
156+
'&session_properties=%7B%22query_max_run_time%22%3A+%221d%22%7D'
157+
'&source=trino-sqlalchemy'
158+
'&verify=false',
159+
list(),
160+
dict(
161+
host="localhost",
162+
port=8080,
163+
catalog="system",
164+
user="user@test.org/my_role",
165+
auth=BasicAuthentication("user@test.org/my_role", "pass /*&"),
166+
http_scheme="https",
167+
source="trino-sqlalchemy",
168+
session_properties={"query_max_run_time": "1d"},
169+
http_headers={"trino": 1},
170+
extra_credential=[
171+
("user1@test.org/my_role", "user2@test.org/my_role"),
172+
("user3@test.org/my_role", "user36@test.org/my_role")],
173+
experimental_python_types=True,
174+
client_tags=["1 @& /\"", "sql"],
175+
verify=False,
176+
),
177+
),
66178
],
67179
)
68-
def test_create_connect_args(self, url: URL, expected_args: List[Any], expected_kwargs: Dict[str, Any]):
180+
def test_create_connect_args(
181+
self,
182+
url: URL,
183+
generated_url: str,
184+
expected_args: List[Any],
185+
expected_kwargs: Dict[str, Any]
186+
):
187+
assert repr(url) == generated_url
188+
69189
actual_args, actual_kwargs = self.dialect.create_connect_args(url)
70190

71191
assert actual_args == expected_args

trino/sqlalchemy/__init__.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -10,5 +10,6 @@
1010
# See the License for the specific language governing permissions and
1111
# limitations under the License.
1212
from sqlalchemy.dialects import registry
13+
from .util import _url as URL # noqa
1314

1415
registry.register("trino", "trino.sqlalchemy.dialect", "TrinoDialect")

trino/sqlalchemy/dialect.py

Lines changed: 17 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -13,6 +13,7 @@
1313
from ast import literal_eval
1414
from textwrap import dedent
1515
from typing import Any, Dict, List, Mapping, Optional, Sequence, Tuple
16+
from urllib.parse import unquote_plus, unquote
1617

1718
from sqlalchemy import exc, sql
1819
from sqlalchemy.engine.base import Connection
@@ -80,49 +81,52 @@ def create_connect_args(self, url: URL) -> Tuple[Sequence[Any], Mapping[str, Any
8081

8182
db_parts = (url.database or "system").split("/")
8283
if len(db_parts) == 1:
83-
kwargs["catalog"] = db_parts[0]
84+
kwargs["catalog"] = unquote_plus(db_parts[0])
8485
elif len(db_parts) == 2:
85-
kwargs["catalog"] = db_parts[0]
86-
kwargs["schema"] = db_parts[1]
86+
kwargs["catalog"] = unquote_plus(db_parts[0])
87+
kwargs["schema"] = unquote_plus(db_parts[1])
8788
else:
8889
raise ValueError(f"Unexpected database format {url.database}")
8990

9091
if url.username:
91-
kwargs["user"] = url.username
92+
kwargs["user"] = unquote(url.username)
9293

9394
if url.password:
9495
if not url.username:
9596
raise ValueError("Username is required when specify password in connection URL")
9697
kwargs["http_scheme"] = "https"
97-
kwargs["auth"] = BasicAuthentication(url.username, url.password)
98+
kwargs["auth"] = BasicAuthentication(unquote(url.username), unquote(url.password))
9899

99100
if "access_token" in url.query:
100101
kwargs["http_scheme"] = "https"
101-
kwargs["auth"] = JWTAuthentication(url.query["access_token"])
102+
kwargs["auth"] = JWTAuthentication(unquote(url.query["access_token"]))
102103

103104
if "cert" and "key" in url.query:
104105
kwargs["http_scheme"] = "https"
105-
kwargs["auth"] = CertificateAuthentication(url.query['cert'], url.query['key'])
106+
kwargs["auth"] = CertificateAuthentication(unquote(url.query['cert']), unquote(url.query['key']))
106107

107108
if "source" in url.query:
108-
kwargs["source"] = url.query["source"]
109+
kwargs["source"] = unquote(url.query["source"])
109110
else:
110111
kwargs["source"] = "trino-sqlalchemy"
111112

112113
if "session_properties" in url.query:
113-
kwargs["session_properties"] = json.loads(url.query["session_properties"])
114+
kwargs["session_properties"] = json.loads(unquote(url.query["session_properties"]))
114115

115116
if "http_headers" in url.query:
116-
kwargs["http_headers"] = json.loads(url.query["http_headers"])
117+
kwargs["http_headers"] = json.loads(unquote(url.query["http_headers"]))
117118

118119
if "extra_credential" in url.query:
119-
kwargs["extra_credential"] = literal_eval(url.query["extra_credential"])
120+
kwargs["extra_credential"] = literal_eval(unquote(url.query["extra_credential"]))
120121

121122
if "client_tags" in url.query:
122-
kwargs["client_tags"] = json.loads(url.query["client_tags"])
123+
kwargs["client_tags"] = json.loads(unquote(url.query["client_tags"]))
123124

124125
if "experimental_python_types" in url.query:
125-
kwargs["experimental_python_types"] = json.loads(url.query["experimental_python_types"])
126+
kwargs["experimental_python_types"] = json.loads(unquote(url.query["experimental_python_types"]))
127+
128+
if "verify" in url.query:
129+
kwargs["verify"] = json.loads(unquote(url.query["verify"]))
126130

127131
return args, kwargs
128132

0 commit comments

Comments
 (0)