aboutsummaryrefslogtreecommitdiffhomepage
path: root/tests/cc/test_cc_maintenance_updates.py
blob: be010a25a9a48a0e436ca82a3b25fccb2dbeca6c (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
import json
from collections.abc import Generator
from importlib import resources
from pathlib import Path

import pytest
import tests.data.cc.dataset

from sec_certs.dataset.cc import CCDatasetMaintenanceUpdates
from sec_certs.sample.cc_maintenance_update import CCMaintenanceUpdate


@pytest.fixture(scope="module")
def data_dir() -> Generator[Path, None, None]:
    with resources.path(tests.data.cc.dataset, "") as path:
        yield path


@pytest.fixture
def mu_dset(data_dir: Path, tmp_path_factory) -> CCDatasetMaintenanceUpdates:
    tmp_dir = tmp_path_factory.mktemp("mu_dset")
    dset = CCDatasetMaintenanceUpdates.from_json(data_dir / "auxiliary_datasets/maintenances/maintenance_updates.json")
    dset.copy_dataset(tmp_dir)
    return dset


def test_methods_not_meant_to_be_implemented():
    dset = CCDatasetMaintenanceUpdates()
    with pytest.raises(NotImplementedError):
        dset.analyze_certificates()
    with pytest.raises(NotImplementedError):
        dset._compute_heuristics_body()
    with pytest.raises(NotImplementedError):
        dset.process_auxiliary_datasets()
    with pytest.raises(NotImplementedError):
        dset.compute_related_cves()
    with pytest.raises(NotImplementedError):
        dset.get_certs_from_web()


def test_download_artifacts(mu_dset: CCDatasetMaintenanceUpdates):
    # Conversion and extraction is identical to CC, will not test.
    mu_dset.download_all_artifacts()
    mu = mu_dset["cert_8f08cacb49a742fb_update_559ed93dd80320b5"]

    if not (mu.state.report.download_ok or mu.state.st.download_ok):
        pytest.xfail(reason="Fail due to error on CC server.")

    assert mu.state.report.pdf_hash == "80bada65614c1b037c13efa78996a8910700d0e05a3ca217286f76d7dacefe62"
    assert mu.state.st.pdf_hash == "d42e4364d037ba742fcd4050a9a84d0e6300f93eb68bcfe8c61f72c429c9ceca"


def test_dataset_to_json(mu_dset: CCDatasetMaintenanceUpdates, data_dir: Path, tmp_path: Path):
    mu_dset.to_json(tmp_path / "dset.json")

    with (tmp_path / "dset.json").open("r") as handle:
        data = json.load(handle)

    with (data_dir / "auxiliary_datasets/maintenances/maintenance_updates.json").open("r") as handle:
        template_data = json.load(handle)

    del template_data["timestamp"]
    del data["timestamp"]
    del template_data["state"]["sec_certs_version"]
    del data["state"]["sec_certs_version"]
    assert data == template_data


def test_dataset_from_json(mu_dset: CCDatasetMaintenanceUpdates, data_dir: Path):
    assert mu_dset == CCDatasetMaintenanceUpdates.from_json(
        data_dir / "auxiliary_datasets/maintenances/maintenance_updates.json"
    )


def test_to_pandas(mu_dset: CCDatasetMaintenanceUpdates):
    df = mu_dset.to_pandas()
    assert df.shape == (len(mu_dset), len(CCMaintenanceUpdate.pandas_columns) - 1)
    assert df.index.name == "dgst"
    assert set(df.columns) == set(CCMaintenanceUpdate.pandas_columns) - {"dgst"}


@pytest.mark.remote
def test_from_web():
    dset = CCDatasetMaintenanceUpdates.from_web()
    assert dset is not None
    assert len(dset) >= 492  # Contents as of November 2022, maintenances should not disappear