From 9693f8d3c180ad82ec6c31e0d0481ea85b85af24 Mon Sep 17 00:00:00 2001 From: Luke Yang Date: Fri, 19 Jul 2024 18:02:19 -0400 Subject: [PATCH 1/2] BACK-3396: allow data uri containing a json to omit utf-8 --- docs/changelog.md | 4 ++ docs/index.md | 2 +- offchain/metadata/adapters/data_uri.py | 2 +- pyproject.toml | 2 +- tests/metadata/adapters/test_data_adapter.py | 39 +++++++++++++++++++- 5 files changed, 44 insertions(+), 5 deletions(-) diff --git a/docs/changelog.md b/docs/changelog.md index a2569c2..647e86e 100644 --- a/docs/changelog.md +++ b/docs/changelog.md @@ -1,5 +1,9 @@ # Changelog +## v0.3.5 + +- Allow data uri containing a json to omit "utf-8" encoding + ## v0.3.4 - Fix Nouns parser to make sure image uri is properly base64-encoded svg diff --git a/docs/index.md b/docs/index.md index 57befb7..3e14c01 100644 --- a/docs/index.md +++ b/docs/index.md @@ -1,6 +1,6 @@ # Getting Started -Documentation for version: **v0.3.4** +Documentation for version: **v0.3.5** ## Overview diff --git a/offchain/metadata/adapters/data_uri.py b/offchain/metadata/adapters/data_uri.py index 094f928..d4c2043 100644 --- a/offchain/metadata/adapters/data_uri.py +++ b/offchain/metadata/adapters/data_uri.py @@ -18,7 +18,7 @@ def decode_data_url(data_url): # type: ignore[no-untyped-def] decoded_data = base64.b64decode(data) decoded_text = decoded_data.decode("utf-8") return decoded_text - elif "json;utf8" in data_parts[0]: + elif "json;utf8" in data_parts[0] or "json" in data_parts[0]: decoded_data = urlopen(data_url).read() decoded_text = json.dumps(json.loads(decoded_data)) return decoded_text diff --git a/pyproject.toml b/pyproject.toml index 7e7acce..2315ce5 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -1,6 +1,6 @@ [tool.poetry] name = "offchain" -version = "0.3.4" +version = "0.3.5" description = "Open source metadata processing framework" authors = ["Zora eng "] readme = "README.md" diff --git a/tests/metadata/adapters/test_data_adapter.py b/tests/metadata/adapters/test_data_adapter.py index 25cacdb..2e046d2 100644 --- a/tests/metadata/adapters/test_data_adapter.py +++ b/tests/metadata/adapters/test_data_adapter.py @@ -29,7 +29,7 @@ async def test_gen_head(self, httpx_mock: HTTPXMock): @pytest.mark.asyncio async def test_gen_head_not_base64(self, httpx_mock: HTTPXMock): adapter = DataURIAdapter() - data_url = "data:application/json;utf8,{\"name\":\"here for now\",\"description\":\"sometimes i don't know how to feel when i'm away.\", \"image\": \"\"}" # noqa + data_url = 'data:application/json;utf8,{"name":"here for now","description":"sometimes i don\'t know how to feel when i\'m away.", "image": ""}' # noqa async with httpx.AsyncClient() as client: result = await adapter.gen_head(url=data_url, sess=client) @@ -45,6 +45,26 @@ async def test_gen_head_not_base64(self, httpx_mock: HTTPXMock): outgoing_request = httpx_mock.get_requests() assert not outgoing_request + @pytest.mark.asyncio + async def test_gen_head_json_unspecified_encoding(self, httpx_mock: HTTPXMock): + adapter = DataURIAdapter() + json_str = '{"name":"here for now","description":"sometimes i don\'t know how to feel when i\'m away.", "image": ""}' # noqa + data_url = f"data:application/json,{json_str}" + async with httpx.AsyncClient() as client: + result = await adapter.gen_head(url=data_url, sess=client) + + expected = httpx.Response( + status_code=200, + headers={"content-type": "application/json", "content-length": "2600"}, + request=httpx.Request(method="HEAD", url=data_url), + ) + assert result.status_code == 200 + assert result.request.method == "HEAD" + assert result.headers == expected.headers + # no real request was made + outgoing_request = httpx_mock.get_requests() + assert not outgoing_request + @pytest.mark.asyncio async def test_gen_send(self, httpx_mock: HTTPXMock): adapter = DataURIAdapter() @@ -61,7 +81,7 @@ async def test_gen_send(self, httpx_mock: HTTPXMock): @pytest.mark.asyncio async def test_gen_send_not_base64(self, httpx_mock: HTTPXMock): adapter = DataURIAdapter() - json_str = "{\"name\":\"here for now\",\"description\":\"sometimes i don't know how to feel when i'm away.\", \"image\": \"\"}" # noqa + json_str = '{"name":"here for now","description":"sometimes i don\'t know how to feel when i\'m away.", "image": ""}' # noqa data_url = f"data:application/json;utf8,{json_str}" async with httpx.AsyncClient() as client: result = await adapter.gen_send(url=data_url, sess=client) @@ -72,3 +92,18 @@ async def test_gen_send_not_base64(self, httpx_mock: HTTPXMock): # no real request was made outgoing_request = httpx_mock.get_requests() assert not outgoing_request + + @pytest.mark.asyncio + async def test_gen_send_json_unspecified_encoding(self, httpx_mock: HTTPXMock): + adapter = DataURIAdapter() + json_str = '{"name":"here for now","description":"sometimes i don\'t know how to feel when i\'m away.", "image": ""}' # noqa + data_url = f"data:application/json,{json_str}" + async with httpx.AsyncClient() as client: + result = await adapter.gen_send(url=data_url, sess=client) + + assert result.status_code == 200 + assert result.request.method == "GET" + assert json.loads(result.text) == json.loads(json_str) + # no real request was made + outgoing_request = httpx_mock.get_requests() + assert not outgoing_request From 45b23b8ce10826cf3acad7a5e8d2279fee12fe55 Mon Sep 17 00:00:00 2001 From: Luke Yang Date: Mon, 5 Aug 2024 11:57:47 -0700 Subject: [PATCH 2/2] BACK-3396: fix unit test --- offchain/metadata/adapters/data_uri.py | 2 +- tests/metadata/fetchers/test_metadata_fetcher.py | 12 +++++++++++- 2 files changed, 12 insertions(+), 2 deletions(-) diff --git a/offchain/metadata/adapters/data_uri.py b/offchain/metadata/adapters/data_uri.py index d4c2043..d773f61 100644 --- a/offchain/metadata/adapters/data_uri.py +++ b/offchain/metadata/adapters/data_uri.py @@ -18,7 +18,7 @@ def decode_data_url(data_url): # type: ignore[no-untyped-def] decoded_data = base64.b64decode(data) decoded_text = decoded_data.decode("utf-8") return decoded_text - elif "json;utf8" in data_parts[0] or "json" in data_parts[0]: + elif "json" in data_parts[0]: decoded_data = urlopen(data_url).read() decoded_text = json.dumps(json.loads(decoded_data)) return decoded_text diff --git a/tests/metadata/fetchers/test_metadata_fetcher.py b/tests/metadata/fetchers/test_metadata_fetcher.py index 67240d7..59c1819 100644 --- a/tests/metadata/fetchers/test_metadata_fetcher.py +++ b/tests/metadata/fetchers/test_metadata_fetcher.py @@ -28,7 +28,17 @@ async def test_gen_fetch_data_adapter(self): # type: ignore[no-untyped-def] @pytest.mark.asyncio async def test_gen_fetch_ipfs_adapter(self): # type: ignore[no-untyped-def] - fetcher = MetadataFetcher() + fetcher = MetadataFetcher( + async_adapter_configs=[ + AdapterConfig( + adapter_cls=IPFSAdapter, + mount_prefixes=[ + "ipfs://", + ], + host_prefixes=["https://ipfs.decentralized-content.com/ipfs/"], + ), + ] + ) content = await fetcher.gen_fetch_content( "ipfs://bafkreiboyxwytfyufln3uzyzaixslzvmrqs5ezjo2cio2fymfqf6u57u6u" # noqa )