From 087b57e15762346bc542a693afb17daf616faa22 Mon Sep 17 00:00:00 2001 From: Luke Yang Date: Tue, 9 Apr 2024 20:09:23 -0400 Subject: [PATCH] BACK-2650: fix DataURIAdapter re plain text json data uri --- docs/changelog.md | 4 +++ docs/index.md | 2 +- offchain/metadata/adapters/data_uri.py | 5 +++ pyproject.toml | 2 +- tests/metadata/adapters/test_data_adapter.py | 35 ++++++++++++++++++++ tests/metadata/parsers/test_zora_parser.py | 8 ++--- 6 files changed, 50 insertions(+), 6 deletions(-) diff --git a/docs/changelog.md b/docs/changelog.md index f373ddb..d1776e1 100644 --- a/docs/changelog.md +++ b/docs/changelog.md @@ -1,5 +1,9 @@ # Changelog +## v0.3.2 + +- Fix an issue in `DataURIAdapter` where plain-text json data uri would get ignored + ## v0.3.1 - Trim token_uri in some log outputs, this is mainly useful for data uris that are too long and make logs unreadable diff --git a/docs/index.md b/docs/index.md index f1c3783..8630f6b 100644 --- a/docs/index.md +++ b/docs/index.md @@ -1,6 +1,6 @@ # Getting Started -Documentation for version: **v0.3.1** +Documentation for version: **v0.3.2** ## Overview diff --git a/offchain/metadata/adapters/data_uri.py b/offchain/metadata/adapters/data_uri.py index bcc9a48..094f928 100644 --- a/offchain/metadata/adapters/data_uri.py +++ b/offchain/metadata/adapters/data_uri.py @@ -3,6 +3,7 @@ from urllib.request import urlopen import httpx +import json from requests import PreparedRequest, Response from offchain.metadata.adapters.base_adapter import BaseAdapter @@ -17,6 +18,10 @@ def decode_data_url(data_url): # type: ignore[no-untyped-def] decoded_data = base64.b64decode(data) decoded_text = decoded_data.decode("utf-8") return decoded_text + elif "json;utf8" in data_parts[0]: + decoded_data = urlopen(data_url).read() + decoded_text = json.dumps(json.loads(decoded_data)) + return decoded_text return None diff --git a/pyproject.toml b/pyproject.toml index b602961..2e585c0 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -1,6 +1,6 @@ [tool.poetry] name = "offchain" -version = "0.3.1" +version = "0.3.2" description = "Open source metadata processing framework" authors = ["Zora eng "] readme = "README.md" diff --git a/tests/metadata/adapters/test_data_adapter.py b/tests/metadata/adapters/test_data_adapter.py index d21d409..25cacdb 100644 --- a/tests/metadata/adapters/test_data_adapter.py +++ b/tests/metadata/adapters/test_data_adapter.py @@ -1,4 +1,5 @@ import httpx +import json import pytest from pytest_httpx import HTTPXMock @@ -25,6 +26,25 @@ async def test_gen_head(self, httpx_mock: HTTPXMock): outgoing_request = httpx_mock.get_requests() assert not outgoing_request + @pytest.mark.asyncio + async def test_gen_head_not_base64(self, httpx_mock: HTTPXMock): + adapter = DataURIAdapter() + data_url = "data:application/json;utf8,{\"name\":\"here for now\",\"description\":\"sometimes i don't know how to feel when i'm away.\", \"image\": \"\"}" # noqa + async with httpx.AsyncClient() as client: + result = await adapter.gen_head(url=data_url, sess=client) + + expected = httpx.Response( + status_code=200, + headers={"content-type": "application/json;utf8", "content-length": "2600"}, + request=httpx.Request(method="HEAD", url=data_url), + ) + assert result.status_code == 200 + assert result.request.method == "HEAD" + assert result.headers == expected.headers + # no real request was made + outgoing_request = httpx_mock.get_requests() + assert not outgoing_request + @pytest.mark.asyncio async def test_gen_send(self, httpx_mock: HTTPXMock): adapter = DataURIAdapter() @@ -37,3 +57,18 @@ async def test_gen_send(self, httpx_mock: HTTPXMock): # no real request was made outgoing_request = httpx_mock.get_requests() assert not outgoing_request + + @pytest.mark.asyncio + async def test_gen_send_not_base64(self, httpx_mock: HTTPXMock): + adapter = DataURIAdapter() + json_str = "{\"name\":\"here for now\",\"description\":\"sometimes i don't know how to feel when i'm away.\", \"image\": \"\"}" # noqa + data_url = f"data:application/json;utf8,{json_str}" + async with httpx.AsyncClient() as client: + result = await adapter.gen_send(url=data_url, sess=client) + + assert result.status_code == 200 + assert result.request.method == "GET" + assert json.loads(result.text) == json.loads(json_str) + # no real request was made + outgoing_request = httpx_mock.get_requests() + assert not outgoing_request diff --git a/tests/metadata/parsers/test_zora_parser.py b/tests/metadata/parsers/test_zora_parser.py index 3dd7ae8..ecc5110 100644 --- a/tests/metadata/parsers/test_zora_parser.py +++ b/tests/metadata/parsers/test_zora_parser.py @@ -19,7 +19,7 @@ class TestZoraParser: token = Token( chain_identifier="ETHEREUM-MAINNET", collection_address="0xabefbc9fd2f806065b4f3c237d4b59d9a97bcac7", - token_id=5769, + token_id=31861, ) raw_data = { @@ -46,8 +46,8 @@ def test_zora_parser_parses_metadata(self): # type: ignore[no-untyped-def] token=Token( chain_identifier="ETHEREUM-MAINNET", collection_address="0xabefbc9fd2f806065b4f3c237d4b59d9a97bcac7", - token_id=5769, - uri="https://zora-dev.mypinata.cloud/ipfs/bafkreigux6jujn5hvlmptgzgok4reaie2gkuvsk2kynnalsyfgr4g35dkm", + token_id=31861, + uri="https://gateway.pinata.cloud/ipfs/bafkreid3jq3mlqz4d3w7emkxpftmfjbbxtkwe7kf25lzp2krwcxfd57m6q", ), raw_data={ "description": "A Lonely Soul,\n\nI've felt lonely lately. Somewhere deep inside, detached. \n\nThere must be plenty of lost souls wandering the globe. Looking to belong; to understand their purpose.\n\nI know my purpose, but I fear I've burned up surviving to the moment.\n\nDoes this count?\nAm I still pushing forward?\n\nI hope so...\n\nDo I still have time?\nAm I just floating?\n\nPlease, don't give up.\n\nAge 23 (2021)\n4096x4096px", @@ -63,7 +63,7 @@ def test_zora_parser_parses_metadata(self): # type: ignore[no-untyped-def] image=MediaDetails( size=13548199, sha256=None, - uri="https://zora-dev.mypinata.cloud/ipfs/bafybeiffwxjez2axebcprj2h7wkohr2pdbvuv37f7uxyptuw7o6t5fvppu", + uri="https://gateway.pinata.cloud/ipfs/bafybeifavbhn6ys3k4tvngt4rxkoo7vabiv4lnlszwkvdncjg245qz5chq", mime_type="image/jpeg", ), content=None,