SUMMARY = "Updates the NVD CVE database"
LICENSE = "MIT"

# NOTE(review): presumably set because nothing in this recipe is compiled, so
# the default toolchain dependencies are not needed - confirm.
INHIBIT_DEFAULT_DEPS = "1"

inherit native

# Drop the tasks this recipe does not use; the only task body defined in this
# file is do_fetch.
deltask do_unpack
deltask do_patch
deltask do_configure
deltask do_compile
deltask do_install
deltask do_populate_sysroot
| 14 | |
python () {
    # This recipe only makes sense alongside the cve-check class: skip it at
    # parse time whenever that class has not been inherited.
    cve_check_enabled = bb.data.inherits_class("cve-check", d)
    if not cve_check_enabled:
        raise bb.parse.SkipRecipe("Skip recipe when cve-check class is not loaded.")
}
| 19 | |
python do_fetch() {
    """
    Update NVD database with json data feed

    For every year from YEAR_START up to the current year, fetch the feed's
    ".meta" file and compare its lastModifiedDate with the value stored in the
    META table.  When they differ, that year's PRODUCTS rows are deleted and
    the year is re-imported from the ".json.gz" feed through update_db().

    Changes are committed only once every year has been processed.  On any
    fetch or metadata failure the task warns and returns without committing,
    so the partial update is discarded.  Status lines are appended to
    ${TMPDIR}/cve_check.
    """
    import gzip
    import sqlite3
    import time
    # urllib.request and urllib.error must be imported explicitly: importing
    # "urllib" or "urllib.parse" alone does not guarantee they are loaded.
    import urllib.error
    import urllib.parse
    import urllib.request
    from datetime import date

    import bb.progress
    import bb.utils

    bb.utils.export_proxies(d)

    BASE_URL = "https://nvd.nist.gov/feeds/json/cve/1.1/nvdcve-1.1-"
    YEAR_START = 2002

    db_file = d.getVar("CVE_CHECK_DB_FILE")
    db_dir = os.path.dirname(db_file)
    journal_file = "{0}-journal".format(db_file)

    if os.path.exists(journal_file):
        # If a journal is present the last update might have been interrupted. In that case,
        # just wipe any leftovers and force the DB to be recreated.
        os.remove(journal_file)

        if os.path.exists(db_file):
            os.remove(db_file)

    # Don't refresh the database more than once an hour
    try:
        if time.time() - os.path.getmtime(db_file) < (60*60):
            bb.debug(2, "Recently updated, skipping")
            return
    except OSError:
        # No database file yet (or it cannot be stat'ed): carry on and build it.
        pass

    bb.utils.mkdirhier(db_dir)

    # Connect to database
    conn = sqlite3.connect(db_file)
    try:
        c = conn.cursor()

        initialize_db(c)

        with bb.progress.ProgressHandler(d) as ph, open(os.path.join(d.getVar("TMPDIR"), 'cve_check'), 'a') as cve_f:
            # Take a single snapshot of "today" so the year range, the progress
            # total and the success note all agree even across midnight.
            today = date.today()
            total_years = today.year + 1 - YEAR_START
            for i, year in enumerate(range(YEAR_START, today.year + 1)):
                bb.debug(2, "Updating %d" % year)
                ph.update((float(i + 1) / total_years) * 100)
                year_url = BASE_URL + str(year)
                meta_url = year_url + ".meta"
                json_url = year_url + ".json.gz"

                # Retrieve meta last modified date
                try:
                    with urllib.request.urlopen(meta_url) as response:
                        meta_text = response.read().decode("utf-8")
                except urllib.error.URLError as e:
                    cve_f.write('Warning: CVE db update error, Unable to fetch CVE data.\n\n')
                    bb.warn("Failed to fetch CVE data (%s)" % e.reason)
                    return

                for line in meta_text.splitlines():
                    # partition() tolerates lines without a ":" (e.g. blank
                    # lines), where unpacking split(":", 1) would raise.
                    key, sep, value = line.partition(":")
                    if sep and key == "lastModifiedDate":
                        last_modified = value
                        break
                else:
                    bb.warn("Cannot parse CVE metadata, update failed")
                    return

                # Compare with current db last modified date
                c.execute("select DATE from META where YEAR = ?", (year,))
                meta = c.fetchone()
                if not meta or meta[0] != last_modified:
                    bb.debug(2, "Updating entries")
                    # Clear products table entries corresponding to current year
                    c.execute("delete from PRODUCTS where ID like ?", ('CVE-%d%%' % year,))

                    # Update db with current year json file
                    try:
                        with urllib.request.urlopen(json_url) as response:
                            json_data = gzip.decompress(response.read()).decode('utf-8')
                    except urllib.error.URLError as e:
                        cve_f.write('Warning: CVE db update error, CVE data is outdated.\n\n')
                        bb.warn("Cannot parse CVE data (%s), update failed" % e.reason)
                        return

                    update_db(c, json_data)
                    c.execute("insert or replace into META values (?, ?)", [year, last_modified])
                else:
                    bb.debug(2, "Already up to date (last modified %s)" % last_modified)
                # Update success, set the date to cve_check file.
                if year == today.year:
                    cve_f.write('CVE database update : %s\n\n' % today)

        conn.commit()
    finally:
        # Always release the connection.  On the early-return paths nothing
        # was committed, so closing discards the partial update.
        conn.close()
}
| 116 | |
# Hold the CVE database lock file while do_fetch runs.
# NOTE(review): presumably this serialises access to the database with the
# other users of CVE_CHECK_DB_FILE_LOCK - confirm against cve-check.bbclass.
do_fetch[lockfiles] += "${CVE_CHECK_DB_FILE_LOCK}"
# Clear the file-checksums and vardeps flags for do_fetch.
# NOTE(review): presumably so the task signature does not depend on files or
# variables - confirm.
do_fetch[file-checksums] = ""
do_fetch[vardeps] = ""
| 120 | |
def initialize_db(c):
    """
    Create the META, NVD and PRODUCTS tables and the PRODUCTS(ID) index.

    Every statement uses IF NOT EXISTS, so running this against an already
    initialised database leaves it untouched.
    """
    schema = (
        "CREATE TABLE IF NOT EXISTS META (YEAR INTEGER UNIQUE, DATE TEXT)",

        "CREATE TABLE IF NOT EXISTS NVD (ID TEXT UNIQUE, SUMMARY TEXT, "
        "SCOREV2 TEXT, SCOREV3 TEXT, MODIFIED INTEGER, VECTOR TEXT)",

        "CREATE TABLE IF NOT EXISTS PRODUCTS (ID TEXT, "
        "VENDOR TEXT, PRODUCT TEXT, VERSION_START TEXT, OPERATOR_START TEXT, "
        "VERSION_END TEXT, OPERATOR_END TEXT)",

        "CREATE INDEX IF NOT EXISTS PRODUCT_ID_IDX on PRODUCTS(ID);",
    )
    for statement in schema:
        c.execute(statement)
Brad Bishop | 96ff198 | 2019-08-19 13:50:42 -0400 | [diff] [blame] | 131 | |
def parse_node_and_insert(c, node, cveId):
    """
    Insert the vulnerable CPE matches of a configuration node into PRODUCTS.

    Child nodes (node['children']) are processed recursively first, then one
    PRODUCTS row is inserted for every entry of node['cpe_match'] whose
    'vulnerable' flag is true.

    c      -- database cursor; only executemany() is used
    node   -- configuration node (dict) with optional 'children' and
              'cpe_match' lists
    cveId  -- CVE identifier stored in the ID column of every inserted row
    """
    # Parse children node if needed
    for child in node.get('children', ()):
        parse_node_and_insert(c, child, cveId)

    def cpe_generator():
        for cpe in node.get('cpe_match', ()):
            if not cpe['vulnerable']:
                # Skip just this entry.  Returning here would end the
                # generator and silently drop every vulnerable entry that
                # follows it in the same cpe_match list.
                continue

            # cpe23Uri is colon separated; fields 3, 4 and 5 are read as
            # vendor, product and version.
            cpe23 = cpe['cpe23Uri'].split(':')
            vendor = cpe23[3]
            product = cpe23[4]
            version = cpe23[5]

            if version != '*' and version != '-':
                # Version is defined, this is a '=' match
                yield [cveId, vendor, product, version, '=', '', '']
            elif version == '-':
                # no version information is available
                yield [cveId, vendor, product, version, '', '', '']
            else:
                # Parse start version, end version and operators
                op_start = ''
                op_end = ''
                v_start = ''
                v_end = ''

                if 'versionStartIncluding' in cpe:
                    op_start = '>='
                    v_start = cpe['versionStartIncluding']

                # An "Excluding" bound, when present, overrides "Including".
                if 'versionStartExcluding' in cpe:
                    op_start = '>'
                    v_start = cpe['versionStartExcluding']

                if 'versionEndIncluding' in cpe:
                    op_end = '<='
                    v_end = cpe['versionEndIncluding']

                if 'versionEndExcluding' in cpe:
                    op_end = '<'
                    v_end = cpe['versionEndExcluding']

                yield [cveId, vendor, product, v_start, op_start, v_end, op_end]

    c.executemany("insert into PRODUCTS values (?, ?, ?, ?, ?, ?, ?)", cpe_generator())
| 178 | |
def update_db(c, jsondata):
    """
    Load one NVD JSON feed document into the NVD and PRODUCTS tables.

    c         -- database cursor
    jsondata  -- feed content as a JSON string with a top-level 'CVE_Items' list

    Items whose 'impact' entry is empty are skipped.  For every other item a
    row is inserted into (or replaced in) NVD, and each of its configuration
    nodes is handed to parse_node_and_insert().
    """
    import json

    for item in json.loads(jsondata)['CVE_Items']:
        impact = item['impact']
        if not impact:
            continue

        vector = None
        cve_id = item['cve']['CVE_data_meta']['ID']
        summary = item['cve']['description']['description_data'][0]['value']
        modified = item['lastModifiedDate']

        # CVSS v2: a missing key leaves the score at 0.0.
        try:
            vector = impact['baseMetricV2']['cvssV2']['accessVector']
            score_v2 = impact['baseMetricV2']['cvssV2']['baseScore']
        except KeyError:
            score_v2 = 0.0

        # CVSS v3: its attack vector is only a fallback for a missing v2 one.
        try:
            vector = vector or impact['baseMetricV3']['cvssV3']['attackVector']
            score_v3 = impact['baseMetricV3']['cvssV3']['baseScore']
        except KeyError:
            vector = vector or "UNKNOWN"
            score_v3 = 0.0

        row = [cve_id, summary, score_v2, score_v3, modified, vector]
        c.execute("insert or replace into NVD values (?, ?, ?, ?, ?, ?)", row)

        for config in item['configurations']['nodes']:
            parse_node_and_insert(c, config, cve_id)
| 209 | |
| 210 | |
# NOTE(review): per the BitBake manual, nostamp means no stamp file is written
# and the task always re-runs; do_fetch itself limits refreshes to one per
# hour - confirm this is the intended combination.
do_fetch[nostamp] = "1"

# NOTE(review): presumably keeps this helper recipe out of "world" builds -
# confirm.
EXCLUDE_FROM_WORLD = "1"