feat: Store image data keyed by URL query param
This commit is contained in:
parent
b8a65a8dd4
commit
d3f38b426d
|
@ -1,4 +1,7 @@
|
||||||
import json
|
import json
|
||||||
|
from urllib.parse import urlparse, parse_qs
|
||||||
|
|
||||||
|
data = {}
|
||||||
|
|
||||||
def main():
|
def main():
|
||||||
"""
|
"""
|
||||||
|
@ -14,7 +17,6 @@ def main():
|
||||||
print("No entries found in the HAR file.")
|
print("No entries found in the HAR file.")
|
||||||
return
|
return
|
||||||
|
|
||||||
print("Files found in the HAR archive:")
|
|
||||||
for entry in entries:
|
for entry in entries:
|
||||||
response = entry.get('response', {})
|
response = entry.get('response', {})
|
||||||
content = response.get('content', {})
|
content = response.get('content', {})
|
||||||
|
@ -23,14 +25,30 @@ def main():
|
||||||
if not mime_type.startswith('image/'):
|
if not mime_type.startswith('image/'):
|
||||||
continue
|
continue
|
||||||
|
|
||||||
request = entry.get('request', {})
|
request_obj = entry.get('request', {})
|
||||||
url = request.get('url')
|
request_url_str = request_obj.get('url')
|
||||||
if url:
|
|
||||||
print(url)
|
if not request_url_str:
|
||||||
else:
|
# If the entry's main request URL is missing, skip.
|
||||||
# This case might be less likely if we are filtering by mimeType,
|
continue
|
||||||
# but kept for robustness if an image entry somehow lacks a URL.
|
|
||||||
print("Image entry found with no request URL.")
|
parsed_request_url = urlparse(request_url_str)
|
||||||
|
query_params = parse_qs(parsed_request_url.query)
|
||||||
|
|
||||||
|
# The key for our 'data' dict is the value of the 'url' query parameter
|
||||||
|
# from the request's URL string.
|
||||||
|
key_from_query_param = query_params.get('url', [None])[0]
|
||||||
|
|
||||||
|
if not key_from_query_param:
|
||||||
|
# If the 'url' query parameter is not found in the request_url_str, skip.
|
||||||
|
continue
|
||||||
|
|
||||||
|
# The value for our 'data' dict is the response's base64 encoded text.
|
||||||
|
response_text = content.get('text')
|
||||||
|
|
||||||
|
if response_text is not None:
|
||||||
|
# Ensure response_text is not None (it can be an empty string for 0-byte files)
|
||||||
|
data[key_from_query_param] = response_text
|
||||||
|
|
||||||
|
|
||||||
if __name__ == "__main__":
|
if __name__ == "__main__":
|
||||||
|
|
Loading…
Reference in New Issue
Block a user