|
| 1 | +# |
| 2 | +# Copyright (c) nexB Inc. and others. All rights reserved. |
| 3 | +# VulnerableCode is a trademark of nexB Inc. |
| 4 | +# SPDX-License-Identifier: Apache-2.0 |
| 5 | +# See http://www.apache.org/licenses/LICENSE-2.0 for the license text. |
| 6 | +# See https://github.com/aboutcode-org/vulnerablecode for support or download. |
| 7 | +# See https://aboutcode.org for more information about nexB OSS projects. |
| 8 | +# |
| 9 | + |
| 10 | +import re |
| 11 | +from pathlib import Path |
| 12 | +from typing import Iterable |
| 13 | +from typing import List |
| 14 | + |
| 15 | +import pytz |
| 16 | +import saneyaml |
| 17 | +from dateutil import parser |
| 18 | +from fetchcode.vcs import fetch_via_vcs |
| 19 | +from packageurl import PackageURL |
| 20 | +from univers.version_constraint import VersionConstraint |
| 21 | +from univers.version_range import GitHubVersionRange |
| 22 | +from univers.version_range import GolangVersionRange |
| 23 | +from univers.versions import SemverVersion |
| 24 | + |
| 25 | +from vulnerabilities.importer import AdvisoryData |
| 26 | +from vulnerabilities.importer import AffectedPackage |
| 27 | +from vulnerabilities.importer import ReferenceV2 |
| 28 | +from vulnerabilities.pipelines import VulnerableCodeBaseImporterPipelineV2 |
| 29 | +from vulnerabilities.utils import get_advisory_url |
| 30 | +from vulnerabilities.utils import split_markdown_front_matter |
| 31 | + |
# Predicate for a plain dotted release number such as "1", "1.2" or "1.10.3".
# Returns a match object (truthy) or None. ``fullmatch`` anchors both ends, so
# strings like ".", "1..2", "1.2." or a value with a trailing newline are
# rejected instead of being handed to the version parser.
is_release = re.compile(r"\d+(?:\.\d+)*").fullmatch
| 33 | + |
| 34 | + |
class IstioImporterPipeline(VulnerableCodeBaseImporterPipelineV2):
    """
    Importer for Istio.io security advisories.

    The pipeline clones the istio.io website repository, reads the YAML front
    matter of each markdown file found under ``content/en/news/security`` and
    yields one ``AdvisoryData`` per file that declares a title.
    """

    pipeline_id = "istio_importer_v2"
    spdx_license_expression = "Apache-2.0"
    license_url = "https://github.com/istio/istio.io/blob/master/LICENSE"
    repo_url = "git+https://github.com/istio/istio.io"
    unfurl_version_ranges = True

    @classmethod
    def steps(cls):
        """Return the ordered pipeline steps: clone, collect/store, clean up."""
        return (
            cls.clone,
            cls.collect_and_store_advisories,
            cls.clean_downloads,
        )

    def _advisory_files(self) -> Iterable[Path]:
        """Yield every advisory markdown file of the clone, skipping ``_index.md`` pages."""
        advisories_dir = Path(self.vcs_response.dest_dir) / "content/en/news/security"
        for md_file in advisories_dir.rglob("*.md"):
            if not md_file.name.endswith("_index.md"):
                yield md_file

    def advisories_count(self) -> int:
        """Return the number of advisory markdown files found in the clone."""
        return sum(1 for _ in self._advisory_files())

    def clone(self):
        """Clone the advisory repository and keep the VCS response on the instance."""
        self.log(f"Cloning `{self.repo_url}`")
        self.vcs_response = fetch_via_vcs(self.repo_url)

    def collect_advisories(self) -> Iterable[AdvisoryData]:
        """
        Yield an ``AdvisoryData`` for each advisory markdown file of the clone.

        Files whose front matter has no ``title`` are skipped (and logged)
        because the title is used as the advisory id.
        """
        base_path = Path(self.vcs_response.dest_dir)

        for md_file in self._advisory_files():
            # Read once: the same text feeds the parser and the stored original.
            text = md_file.read_text(encoding="utf-8")
            data = self._load_front_matter(text)

            title = data.get("title") or ""
            if not title:
                self.log(f"Skipping advisory without a title: {md_file}")
                continue

            advisory_url = get_advisory_url(
                file=md_file,
                base_path=base_path,
                url="https://github.com/istio/istio.io/blob/master/",
            )

            # ``or []`` also covers keys that are present but explicitly null.
            constraints = self.get_version_constraints(data.get("releases") or [])
            cves = data.get("cves") or []

            affected_packages = []
            if constraints:
                affected_packages.extend(
                    [
                        AffectedPackage(
                            package=PackageURL(type="golang", namespace="istio.io", name="istio"),
                            affected_version_range=GolangVersionRange(constraints=constraints),
                        ),
                        AffectedPackage(
                            package=PackageURL(type="github", namespace="istio", name="istio"),
                            affected_version_range=GitHubVersionRange(constraints=constraints),
                        ),
                    ]
                )

            references = [
                ReferenceV2(
                    reference_id=title,
                    url=f"https://istio.io/latest/news/security/{title}/",
                )
            ]

            yield AdvisoryData(
                advisory_id=title,
                aliases=cves,
                summary=data.get("description") or "",
                affected_packages=affected_packages,
                references_v2=references,
                date_published=self._parse_publish_date(data.get("publishdate")),
                url=advisory_url,
                original_advisory_text=text,
            )

    def _load_front_matter(self, text: str) -> dict:
        """
        Return the YAML front matter of ``text`` as a mapping.

        An empty mapping is returned when the front matter is missing, empty or
        is not a mapping, so callers can always use ``.get()``.
        """
        front_matter, _ = split_markdown_front_matter(text)
        data = saneyaml.load(front_matter) if front_matter else None
        return data if isinstance(data, dict) else {}

    def _parse_publish_date(self, value):
        """
        Return ``value`` parsed as a UTC-aware datetime, or None.

        None is returned when ``value`` is empty or cannot be parsed. A naive
        result is labelled as UTC; an offset-aware result is converted to UTC
        rather than relabelled, so the instant is preserved.
        """
        if not value:
            return None
        try:
            parsed = parser.parse(str(value))
        except (ValueError, OverflowError):
            self.log(f"Unable to parse publish date: {value!r}")
            return None
        if parsed.tzinfo is None:
            return parsed.replace(tzinfo=pytz.UTC)
        return parsed.astimezone(pytz.UTC)

    def parse_markdown(self, path: Path) -> dict:
        """Return a mapping of vulnerability data extracted from an advisory."""
        return self._load_front_matter(path.read_text(encoding="utf-8"))

    def get_version_constraints(self, releases: List[str]) -> List[VersionConstraint]:
        """
        Return the version constraints described by the ``releases`` strings.

        Recognized forms, checked in this order:

        - ``All releases prior to X`` gives ``< X``
        - ``All releases X and later`` gives ``>= X``
        - ``X to Y`` gives ``>= X`` and ``<= Y``
        - ``X`` gives ``= X``

        Entries whose version part is not a plain release number according to
        ``is_release`` are ignored.
        """
        if not releases:
            return []
        if isinstance(releases, str):
            # A lone scalar would otherwise be iterated character by character.
            releases = [releases]

        constraints = []
        for release in releases:
            release = str(release).strip()

            if "All releases prior" in release:
                _, _, version = release.rpartition(" ")
                if is_release(version):
                    constraints.append(
                        VersionConstraint(version=SemverVersion(version), comparator="<")
                    )

            elif "All releases" in release and "and later" in release:
                version = release.replace("All releases", "").replace("and later", "").strip()
                if is_release(version):
                    constraints.append(
                        VersionConstraint(version=SemverVersion(version), comparator=">=")
                    )

            elif "to" in release:
                lower, _, upper = release.partition("to")
                lower, upper = lower.strip(), upper.strip()
                # Both bounds must be valid; a half-open range would be misleading.
                if is_release(lower) and is_release(upper):
                    constraints.append(
                        VersionConstraint(version=SemverVersion(lower), comparator=">=")
                    )
                    constraints.append(
                        VersionConstraint(version=SemverVersion(upper), comparator="<=")
                    )

            elif is_release(release):
                constraints.append(
                    VersionConstraint(version=SemverVersion(release), comparator="=")
                )

        return constraints

    def clean_downloads(self):
        """Delete the cloned repository, if there is one."""
        # ``vcs_response`` is only assigned by ``clone``; use getattr so that
        # cleanup after a failed clone does not raise AttributeError.
        vcs_response = getattr(self, "vcs_response", None)
        if vcs_response:
            self.log("Removing cloned repository")
            vcs_response.delete()

    def on_failure(self):
        """Remove the clone when the pipeline fails."""
        self.clean_downloads()
0 commit comments