Skip to content

Commit

Permalink
fix: JSON decode error
Browse files Browse the repository at this point in the history
  • Loading branch information
lxndrblz committed Jun 29, 2024
1 parent feadb6a commit bcbae9b
Show file tree
Hide file tree
Showing 3 changed files with 19 additions and 16 deletions.
7 changes: 1 addition & 6 deletions .github/workflows/build.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -39,9 +39,4 @@ jobs:
python tools/main.py --help
python tools/dump_leveldb.py --help
python tools/dump_localstorage.py --help
python tools/dump_sessionstorage.py --help
- name: Calculate diff 👽
run: |
git diff --no-index --word-diff .\forensicsim-data\expected-result\jane_doe_v_1_4_00_11161.json jane_doe_v_1_4_00_11161.json
git diff --no-index --word-diff .\forensicsim-data\expected-result\john_doe_v_1_4_00_11161.json john_doe_v_1_4_00_11161.json
git diff --no-index --word-diff .\forensicsim-data\expected-result\karelze_v_23306_3309_2530_1346.json karelze_v_23306_3309_2530_1346.json
python tools/dump_sessionstorage.py --help
2 changes: 1 addition & 1 deletion src/forensicsim/backend.py
Original file line number Diff line number Diff line change
Expand Up @@ -129,7 +129,7 @@ def write_results_to_json(data: list[dict[str, Any]], outputpath: Path) -> None:
try:
with open(outputpath, "w", encoding="utf-8") as f:
json.dump(
data, f, indent=4, sort_keys=True, default=str, ensure_ascii=False
data, f, indent=4, default=str, ensure_ascii=False
)
except OSError as e:
print(e)
26 changes: 17 additions & 9 deletions src/forensicsim/parser.py
Original file line number Diff line number Diff line change
Expand Up @@ -2,6 +2,7 @@
import warnings
from dataclasses import dataclass, field
from datetime import datetime
from json import JSONDecodeError
from pathlib import Path
from typing import Any, Optional, Union

Expand All @@ -26,15 +27,22 @@ def strip_html_tags(value: str) -> str:


def decode_dict(properties: Union[bytes, str, dict]) -> dict[str, Any]:
if isinstance(properties, bytes):
soup = BeautifulSoup(properties, features="html.parser")
properties = properties.decode(soup.original_encoding)
if isinstance(properties, dict):
# handle case where nested childs are dicts or list but provided with "" but have to be expanded.
for key, value in properties.items():
if isinstance(value, str) and value.startswith(("[", "{")):
properties[key] = json.loads(value, strict=False)
return properties
try:
if isinstance(properties, bytes):
soup = BeautifulSoup(properties, features="html.parser")
properties = properties.decode(
encoding=soup.original_encoding, errors="ignore"
)
if isinstance(properties, dict):
# handle case where nested childs are dicts or list but provided with "" but have to be expanded.
for key, value in properties.items():
if isinstance(value, str) and value.startswith(("[", "{")):
properties[key] = json.loads(value, strict=False)
return properties
except JSONDecodeError as e:
print(e)
print("Couldn't decode dictionary ", properties)
return {}

return json.loads(properties, strict=False)

Expand Down

0 comments on commit bcbae9b

Please sign in to comment.