nvidia-patch/tools/nv-driver-locator/get_nvidia_downloads.py

276 lines
7.7 KiB
Python
Raw Normal View History

#!/usr/bin/env python3
2019-08-22 12:26:36 +00:00
import sys
import urllib.request
import urllib.error
import urllib.parse
import codecs
import enum
2019-08-22 12:26:36 +00:00
import re
from bs4 import BeautifulSoup
USER_AGENT = 'Mozilla/5.0 (X11; Linux x86_64; rv:65.0) '\
'Gecko/20100101 Firefox/65.0'
2019-08-22 12:26:36 +00:00
DOWNLOAD_URL_RE = re.compile('.*download\.nvidia\.com.*', re.A | re.I)
@enum.unique
class OS(enum.Enum):
Linux_32 = 11
Linux_64 = 12
Windows7_32 = 18
Windows7_64 = 19
Windows10_32 = 56
Windows10_64 = 57
WindowsServer2012R2_32 = 32
WindowsServer2012R2_64 = 44
2019-06-09 18:45:31 +00:00
WindowsServer2016 = 74
WindowsServer2019 = 119
def __str__(self):
return self.name
def __contains__(self, e):
return e in self.__members__
@enum.unique
class CertLevel(enum.Enum):
All = ''
Beta = 0
Certified = 1
ODE = 2
QNF = 3
CRD = 4
def __str__(self):
return self.name
def __contains__(self, e):
return e in self.__members__
@enum.unique
class Product(enum.Enum):
GeForce = (107, 879)
GeForceMobile = (111, 890)
Quadro = (73, 844)
QuadroMobile = (74, 875)
2019-10-12 08:32:00 +00:00
Tesla = (110, 883)
def __str__(self):
return self.name
def __contains__(self, e):
return e in self.__members__
@enum.unique
class DriverType(enum.Enum):
Standard = 0
DCH = 1
def __str__(self):
return self.name
def __contains__(self, e):
return e in self.__members__
@enum.unique
class DriverLanguage(enum.Enum):
English = 1
def __str__(self):
return self.name
def __contains__(self, e):
return e in self.__members__
@enum.unique
class CUDAToolkitVersion(enum.Enum):
Nothing = 0
v10_0 = 20
2019-10-12 08:32:00 +00:00
v10_1 = 21
def __str__(self):
return self.name
def __contains__(self, e):
return e in self.__members__
def parse_args():
import argparse
2019-02-11 18:01:20 +00:00
def check_positive_float(val):
val = float(val)
if val <= 0:
raise ValueError("Value %s is not valid positive float" %
(repr(val),))
return val
parser = argparse.ArgumentParser(
description="Retrieves info about latest NVIDIA drivers from "
"downloads site",
formatter_class=argparse.ArgumentDefaultsHelpFormatter)
parser.add_argument("-o", "--os",
type=OS.__getitem__,
choices=list(OS),
default=OS.Linux_64,
help="OS")
parser.add_argument("-p", "--product",
type=Product.__getitem__,
choices=list(Product),
default=Product.GeForce,
help="GPU Product type")
parser.add_argument("-c", "--certification-level",
type=CertLevel.__getitem__,
choices=list(CertLevel),
default=CertLevel.All,
help="driver certification level")
parser.add_argument("-D", "--dch",
help="Query DCH driver instead of Standard driver",
default=DriverType.Standard,
const=DriverType.DCH,
action="store_const")
2019-02-11 18:01:20 +00:00
parser.add_argument("-T", "--timeout",
type=check_positive_float,
default=10.,
help="timeout for network operations")
args = parser.parse_args()
return args
2019-08-22 12:26:36 +00:00
def fetch_url(url, timeout=10):
http_req = urllib.request.Request(
url,
data=None,
headers={
'User-Agent': USER_AGENT
}
)
2019-02-11 18:01:20 +00:00
with urllib.request.urlopen(http_req, None, timeout) as resp:
coding = resp.headers.get_content_charset()
coding = coding if coding is not None else 'utf-8-sig'
decoder = codecs.getreader(coding)(resp)
res = decoder.read()
return res
2019-08-22 12:26:36 +00:00
def issue_request(query_obj, timeout=10):
ENDPOINT = 'https://www.nvidia.com/Download/processFind.aspx'
url = ENDPOINT + '?' + urllib.parse.urlencode(query_obj)
return fetch_url(url, timeout)
def parse_download_page(url):
try:
body = fetch_url(url)
soup = BeautifulSoup(body, 'html.parser')
except Exception as exc:
print('parse_download_page error: %s' % (str(exc),), file=sys.stderr)
return None
download_div = soup.find('div', id='dnldBttns')
if download_div is None:
download_div = soup.find('div', id='mainContent')
if download_div is None:
print('parse_download_page error: download div not found', file=sys.stderr)
return None
download_anchor = download_div.find('a', attrs={'href': DOWNLOAD_URL_RE})
if download_anchor is not None:
return {
'download_url': download_anchor['href']
}
return None
def parse_product_page(url):
try:
body = fetch_url(url)
soup = BeautifulSoup(body, 'html.parser')
except Exception as exc:
print('parse_product_page error: %s' % (str(exc),), file=sys.stderr)
return None
download_anchor = soup.find('a', attrs={'href': True}, id='lnkDwnldBtn')
if download_anchor is None:
return None
download_page_url = download_anchor['href']
return parse_download_page(urllib.parse.urljoin(url, download_page_url))
def get_drivers(*,
os=OS.Linux_64,
product=Product.GeForce,
certlevel=CertLevel.All,
driver_type=DriverType.Standard,
lang=DriverLanguage.English,
2019-02-11 18:01:20 +00:00
cuda_ver=CUDAToolkitVersion.Nothing,
timeout=10):
psid, pfid = product.value
query = {
'psid': psid,
'pfid': pfid,
'osid': os.value,
'lid': lang.value,
'whql': certlevel.value,
'lang': 'en-us',
'ctk': cuda_ver.value,
}
if os is OS.Windows10_64:
query['dtcid'] = driver_type.value
2019-02-11 18:01:20 +00:00
doc = issue_request(query, timeout)
soup = BeautifulSoup(doc, 'html.parser')
if soup.find(class_='contentBucketMainContent') is None:
return []
driverlistrows = list(
soup.find(class_='contentBucketMainContent')
.find_all('tr', id='driverList'))
if not driverlistrows:
return []
header = soup.find('td', class_='gridHeader').parent
def normalize_header(td):
return td.string.replace(' ', '').lower()
label_tuple = tuple(normalize_header(td) for td in header('td'))
def parse_content_td(td):
s = list(td.strings)
return max(s, key=len).strip() if s else ''
2019-08-22 12:26:36 +00:00
def parse_version(row):
return tuple(parse_content_td(row['version']).split('.'))
def normalize_product_url(url):
res = urllib.parse.urlparse(url, scheme='https', allow_fragments=False)
return urllib.parse.urlunparse(res)
labeled_rows = [dict(zip(label_tuple, tr('td'))) for tr in driverlistrows]
latest_driver_row = max(labeled_rows, key=parse_version)
obj = dict((k, parse_content_td(v)) for k, v in latest_driver_row.items())
product_td = latest_driver_row['name']
product_anchor = product_td.find('a', attrs={"href": True})
if product_anchor is not None:
product_page = normalize_product_url(product_anchor['href'])
obj['product_page'] = product_page
pp_parse_res = parse_product_page(product_page)
if pp_parse_res is not None:
obj.update(pp_parse_res)
return obj
def main():
import pprint
args = parse_args()
pprint.pprint(get_drivers(os=args.os,
product=args.product,
certlevel=args.certification_level,
2019-02-11 18:01:20 +00:00
driver_type=args.dch,
timeout=args.timeout))
if __name__ == '__main__':
main()