onekey-sec · e3krisztian · May 9, 2022 · Apr 7, 2022 · Apr 7, 2022 · Apr 7, 2022
diff --git a/.github/workflows/build-publish-image.yml b/.github/workflows/build-publish-image.yml
@@ -52,7 +52,7 @@ jobs:
         run: docker run --rm ${{ env.DOCKER_IMAGE }} --show-external-dependencies
 
       - name: Check unblob - run for a file with --verbose
-        run: docker run --rm -v "$(pwd)"/tests/integration/archive/zip/regular:/test ${{ env.DOCKER_IMAGE }} -v -e /tmp /test
+        run: docker run --rm -v "$(pwd)"/tests/integration/archive/zip/regular:/test ${{ env.DOCKER_IMAGE }} -v -e /tmp /test/__input__/apple.zip
 
       - name: Build and push
         if: ${{ github.event_name == 'push' && github.ref_name == 'main' }}

diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml
@@ -66,4 +66,4 @@ jobs:
         uses: ./.github/actions/setup-git-lfs
 
       - name: Run pytest
-        run: poetry run pytest
+        run: poetry run pytest -vvv
diff --git a/default.nix b/default.nix
@@ -111,7 +111,7 @@ self // {
 
         # romfs sample file contains some funky symlinks which get
         # removed when source is copyed to the nix store.
-        pytest -k "not test_all_handlers[filesystem.romfs]" --no-cov
+        pytest -vvv -k "not test_all_handlers[filesystem.romfs]" --no-cov
       )
     '';
   });

diff --git a/tests/conftest.py b/tests/conftest.py
@@ -1,15 +1,15 @@
-from unblob.extractors import Command
-from unblob.models import Handler, HexString
+from pathlib import Path
+
+import pytest
+
+from unblob.models import Task, TaskResult
 from unblob.testing import (  # noqa: F401 (module imported but unused)
     configure_logging,
     extraction_config,
 )
 
 
-class TestHandler(Handler):
-    NAME = "test_handler"
-    PATTERNS = [HexString("21 3C")]
-    EXTRACTOR = Command("testcommand", "for", "test", "handler")
-
-    def calculate_chunk(self, *args, **kwargs):
-        pass
+@pytest.fixture
+def task_result() -> TaskResult:
+    task = Task(path=Path("/nonexistent"), depth=0, chunk_id="")  # placeholder task
+    return TaskResult(task)
diff --git a/tests/extractors/test_command.py b/tests/extractors/test_command.py
@@ -51,7 +51,6 @@ def test_command_execution_failure(tmpdir: Path):
     except ExtractError as e:
         assert list(e.reports) == [
             ExtractCommandFailedReport(
-                handler=None,
                 command=mock.ANY,
                 stdout=b"stdout",
                 stderr=b"stderr",
@@ -70,7 +69,6 @@ def test_command_not_found(tmpdir: Path):
     except ExtractError as e:
         assert list(e.reports) == [
             ExtractorDependencyNotFoundReport(
-                handler=None,
                 dependencies=["this-command-should-not-exist-in-any-system"],
             )
         ]
diff --git a/tests/test_cleanup.py b/tests/test_cleanup.py
@@ -9,7 +9,8 @@
 import pytest
 
 from unblob.models import File, Handler, Regex, ValidChunk
-from unblob.processing import ExtractionConfig, process_files
+from unblob.processing import ExtractionConfig, process_file
+from unblob.testing import check_result
 
 _ZIP_CONTENT = b"good file"
 # replacing _ZIP_CONTENT with _DAMAGED_ZIP_CONTENT will result in CRC error at unpacking time
@@ -33,10 +34,8 @@ def wrapzip(filename: str, content: bytes) -> bytes:
 
 
 @pytest.fixture()
-def input_dir(tmp_path: Path):
-    input_dir = tmp_path / "input"
-    input_dir.mkdir()
-    return input_dir
+def input_file(tmp_path: Path) -> Path:
+    return tmp_path / "input_file"  # path only; the file itself is not created here
 
 
 @pytest.fixture()
@@ -46,41 +45,41 @@ def output_dir(tmp_path):
     return output_dir
 
 
-def test_remove_extracted_chunks(input_dir: Path, output_dir: Path):
-    (input_dir / "blob").write_bytes(ZIP_BYTES)
+def test_remove_extracted_chunks(input_file: Path, output_dir: Path):
+    input_file.write_bytes(ZIP_BYTES)
     config = ExtractionConfig(
         extract_root=output_dir,
         entropy_depth=0,
     )
 
-    all_reports = process_files(config, input_dir)
+    all_reports = process_file(config, input_file)
     assert list(output_dir.glob("**/*.zip")) == []
-    assert all_reports == [], f"Unexpected error reports: {all_reports}"
+    check_result(all_reports)
 
 
-def test_keep_all_problematic_chunks(input_dir: Path, output_dir: Path):
-    (input_dir / "blob").write_bytes(DAMAGED_ZIP_BYTES)
+def test_keep_all_problematic_chunks(input_file: Path, output_dir: Path):
+    input_file.write_bytes(DAMAGED_ZIP_BYTES)
     config = ExtractionConfig(
         extract_root=output_dir,
         entropy_depth=0,
     )
 
-    all_reports = process_files(config, input_dir)
+    all_reports = process_file(config, input_file)
     # damaged zip file should not be removed
-    assert all_reports != [], "Unexpectedly no errors found!"
+    assert all_reports.errors != [], "Unexpectedly no errors found!"
     assert list(output_dir.glob("**/*.zip"))
 
 
-def test_keep_all_unknown_chunks(input_dir: Path, output_dir: Path):
-    (input_dir / "blob").write_bytes(b"unknown1" + ZIP_BYTES + b"unknown2")
+def test_keep_all_unknown_chunks(input_file: Path, output_dir: Path):
+    input_file.write_bytes(b"unknown1" + ZIP_BYTES + b"unknown2")
     config = ExtractionConfig(
         extract_root=output_dir,
         entropy_depth=0,
     )
 
-    all_reports = process_files(config, input_dir)
+    all_reports = process_file(config, input_file)
     assert list(output_dir.glob("**/*.unknown"))
-    assert all_reports == [], f"Unexpected error reports: {all_reports}"
+    check_result(all_reports)
 
 
 class _HandlerWithNullExtractor(Handler):
@@ -92,13 +91,13 @@ def calculate_chunk(self, file: File, start_offset: int) -> ValidChunk:
         return ValidChunk(start_offset=start_offset, end_offset=start_offset + 1)
 
 
-def test_keep_chunks_with_null_extractor(input_dir: Path, output_dir: Path):
-    (input_dir / "blob").write_text("some text")
+def test_keep_chunks_with_null_extractor(input_file: Path, output_dir: Path):
+    input_file.write_bytes(b"some text")
     config = ExtractionConfig(
         extract_root=output_dir,
         entropy_depth=0,
         handlers=(_HandlerWithNullExtractor,),
     )
-    all_reports = process_files(config, input_dir)
+    all_reports = process_file(config, input_file)
     assert list(output_dir.glob("**/*.null"))
-    assert all_reports == [], f"Unexpected error reports: {all_reports}"
+    check_result(all_reports)
diff --git a/tests/test_cli.py b/tests/test_cli.py
@@ -4,14 +4,23 @@
 
 import pytest
 from click.testing import CliRunner
-from conftest import TestHandler
 
 import unblob.cli
 from unblob.extractors import Command
 from unblob.handlers import BUILTIN_HANDLERS
+from unblob.models import Handler, HexString
 from unblob.processing import DEFAULT_DEPTH, DEFAULT_PROCESS_NUM, ExtractionConfig
 
 
+class TestHandler(Handler):
+    NAME = "test_handler"
+    PATTERNS = [HexString("21 3C")]  # presumably the bytes 0x21 0x3C ("!<")
+    EXTRACTOR = Command("testcommand", "for", "test", "handler")  # placeholder
+
+    def calculate_chunk(self, *args, **kwargs):
+        pass  # stub: implicitly returns None
+
+
 class ExistingCommandHandler(TestHandler):
     EXTRACTOR = Command("sh", "something")
 
@@ -86,7 +95,7 @@ def test_help(params):
     result = runner.invoke(unblob.cli.cli, params)
     assert result.exit_code == 0
     # NOTE: In practice, it writes "Usage: unblob ...", this is done in the `cli.main` with `click.make_context`
-    assert result.output.startswith("Usage: cli [OPTIONS] FILES...")
+    assert result.output.startswith("Usage: cli [OPTIONS] FILE")
 
 
 @pytest.mark.parametrize(
@@ -118,19 +127,19 @@ def test_without_file(params: List[str]):
     runner = CliRunner()
     result = runner.invoke(unblob.cli.cli, params)
     assert result.exit_code == 2
-    assert "Missing argument 'FILES...'" in result.output
+    assert "Missing argument 'FILE'" in result.output
 
 
 def test_non_existing_file(tmp_path: Path):
     runner = CliRunner()
     path = Path("non/existing/path/54")
     result = runner.invoke(unblob.cli.cli, ["--extract-dir", str(tmp_path), str(path)])
     assert result.exit_code == 2
-    assert "Invalid value for 'FILES...'" in result.output
-    assert f"Path '{str(path)}' does not exist" in result.output
+    assert "Invalid value for 'FILE'" in result.output
+    assert f"File '{str(path)}' does not exist" in result.output
 
 
-def test_empty_dir_as_file(tmp_path: Path):
+def test_dir_for_file(tmp_path: Path):
     runner = CliRunner()
     out_path = tmp_path.joinpath("out")
     out_path.mkdir()
@@ -139,7 +148,7 @@ def test_empty_dir_as_file(tmp_path: Path):
     result = runner.invoke(
         unblob.cli.cli, ["--extract-dir", str(out_path), str(in_path)]
     )
-    assert result.exit_code == 0
+    assert result.exit_code != 0
 
 
 @pytest.mark.parametrize(
@@ -172,13 +181,14 @@ def test_archive_success(
         / "archive"
         / "zip"
         / "regular"
-        / "__input__/"
+        / "__input__"
+        / "apple.zip"
     )
-    process_files_mock = mock.MagicMock()
+    process_file_mock = mock.MagicMock()
     logger_config_mock = mock.MagicMock()
     new_params = params + ["--extract-dir", str(tmp_path), str(in_path)]
     with mock.patch.object(
-        unblob.cli, "process_files", process_files_mock
+        unblob.cli, "process_file", process_file_mock
     ), mock.patch.object(unblob.cli, "configure_logger", logger_config_mock):
         result = runner.invoke(unblob.cli.cli, new_params)
     assert result.exit_code == 0
@@ -192,7 +202,7 @@ def test_archive_success(
         process_num=expected_process_num,
         handlers=BUILTIN_HANDLERS,
     )
-    process_files_mock.assert_called_once_with(config, in_path)
+    process_file_mock.assert_called_once_with(config, in_path, None)
     logger_config_mock.assert_called_once_with(expected_verbosity, tmp_path)
 
 
@@ -214,17 +224,18 @@ def test_keep_extracted_chunks(
         / "archive"
         / "zip"
         / "regular"
-        / "__input__/"
+        / "__input__"
+        / "apple.zip"
     )
     params = args + ["--extract-dir", str(tmp_path), str(in_path)]
 
-    process_files_mock = mock.MagicMock()
-    with mock.patch.object(unblob.cli, "process_files", process_files_mock):
+    process_file_mock = mock.MagicMock()
+    with mock.patch.object(unblob.cli, "process_file", process_file_mock):
         result = runner.invoke(unblob.cli.cli, params)
 
     assert result.exit_code == 0
-    process_files_mock.assert_called_once()
+    process_file_mock.assert_called_once()
     assert (
-        process_files_mock.call_args.args[0].keep_extracted_chunks
+        process_file_mock.call_args.args[0].keep_extracted_chunks
         == keep_extracted_chunks
     ), fail_message