From 4e768a212b8cd0e1df6f863393495bf284752a11 Mon Sep 17 00:00:00 2001 From: Luke Yang Date: Tue, 9 Apr 2024 20:09:23 -0400 Subject: [PATCH] BACK-2650: fix DataURIAdapter re plain text json data uri --- docs/changelog.md | 4 +++ docs/index.md | 2 +- offchain/metadata/adapters/data_uri.py | 5 +++ pyproject.toml | 2 +- tests/metadata/adapters/test_data_adapter.py | 35 ++++++++++++++++++++ 5 files changed, 46 insertions(+), 2 deletions(-) diff --git a/docs/changelog.md b/docs/changelog.md index f373ddb..d1776e1 100644 --- a/docs/changelog.md +++ b/docs/changelog.md @@ -1,5 +1,9 @@ # Changelog +## v0.3.2 + +- Fix an issue in `DataURIAdapter` where plain-text json data uri would get ignored + ## v0.3.1 - Trim token_uri in some log outputs, this is mainly useful for data uris that are too long and make logs unreadable diff --git a/docs/index.md b/docs/index.md index f1c3783..8630f6b 100644 --- a/docs/index.md +++ b/docs/index.md @@ -1,6 +1,6 @@ # Getting Started -Documentation for version: **v0.3.1** +Documentation for version: **v0.3.2** ## Overview diff --git a/offchain/metadata/adapters/data_uri.py b/offchain/metadata/adapters/data_uri.py index bcc9a48..094f928 100644 --- a/offchain/metadata/adapters/data_uri.py +++ b/offchain/metadata/adapters/data_uri.py @@ -3,6 +3,7 @@ from urllib.request import urlopen import httpx +import json from requests import PreparedRequest, Response from offchain.metadata.adapters.base_adapter import BaseAdapter @@ -17,6 +18,10 @@ def decode_data_url(data_url): # type: ignore[no-untyped-def] decoded_data = base64.b64decode(data) decoded_text = decoded_data.decode("utf-8") return decoded_text + elif "json;utf8" in data_parts[0]: + decoded_data = urlopen(data_url).read() + decoded_text = json.dumps(json.loads(decoded_data)) + return decoded_text return None diff --git a/pyproject.toml b/pyproject.toml index b602961..2e585c0 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -1,6 +1,6 @@ [tool.poetry] name = "offchain" -version = "0.3.1" +version = "0.3.2" description = "Open source metadata processing framework" authors = ["Zora eng "] readme = "README.md" diff --git a/tests/metadata/adapters/test_data_adapter.py b/tests/metadata/adapters/test_data_adapter.py index d21d409..25cacdb 100644 --- a/tests/metadata/adapters/test_data_adapter.py +++ b/tests/metadata/adapters/test_data_adapter.py @@ -1,4 +1,5 @@ import httpx +import json import pytest from pytest_httpx import HTTPXMock @@ -25,6 +26,25 @@ async def test_gen_head(self, httpx_mock: HTTPXMock): outgoing_request = httpx_mock.get_requests() assert not outgoing_request + @pytest.mark.asyncio + async def test_gen_head_not_base64(self, httpx_mock: HTTPXMock): + adapter = DataURIAdapter() + data_url = "data:application/json;utf8,{\"name\":\"here for now\",\"description\":\"sometimes i don't know how to feel when i'm away.\", \"image\": \"\"}" # noqa + async with httpx.AsyncClient() as client: + result = await adapter.gen_head(url=data_url, sess=client) + + expected = httpx.Response( + status_code=200, + headers={"content-type": "application/json;utf8", "content-length": "2600"}, + request=httpx.Request(method="HEAD", url=data_url), + ) + assert result.status_code == 200 + assert result.request.method == "HEAD" + assert result.headers == expected.headers + # no real request was made + outgoing_request = httpx_mock.get_requests() + assert not outgoing_request + @pytest.mark.asyncio async def test_gen_send(self, httpx_mock: HTTPXMock): adapter = DataURIAdapter() @@ -37,3 +57,18 @@ async def test_gen_send(self, httpx_mock: HTTPXMock): # no real request was made outgoing_request = httpx_mock.get_requests() assert not outgoing_request + + @pytest.mark.asyncio + async def test_gen_send_not_base64(self, httpx_mock: HTTPXMock): + adapter = DataURIAdapter() + json_str = "{\"name\":\"here for now\",\"description\":\"sometimes i don't know how to feel when i'm away.\", \"image\": \"\"}" # noqa + data_url = f"data:application/json;utf8,{json_str}" + async with httpx.AsyncClient() as client: + result = await adapter.gen_send(url=data_url, sess=client) + + assert result.status_code == 200 + assert result.request.method == "GET" + assert json.loads(result.text) == json.loads(json_str) + # no real request was made + outgoing_request = httpx_mock.get_requests() + assert not outgoing_request