nvidia-patch/tools/nv-driver-locator/get_nvidia_downloads.py

#!/usr/bin/env python3

import sys
import urllib.request
import urllib.error
import urllib.parse
import codecs
import enum
import re
from bs4 import BeautifulSoup

USER_AGENT = 'Mozilla/5.0 (X11; Linux x86_64; rv:65.0) '\
             'Gecko/20100101 Firefox/65.0'
DOWNLOAD_URL_RE = re.compile('.*download\.nvidia\.com.*', re.A | re.I)


@enum.unique
class OS(enum.Enum):
    Linux_32 = 11
    Linux_64 = 12
    Windows7_32 = 18
    Windows7_64 = 19
    Windows10_32 = 56
    Windows10_64 = 57
    WindowsServer2012R2_32 = 32
    WindowsServer2012R2_64 = 44
    WindowsServer2016 = 74
    WindowsServer2019 = 119

    def __str__(self):
        return self.name

    def __contains__(self, e):
        return e in self.__members__


@enum.unique
class CertLevel(enum.Enum):
    All = ''
    Beta = 0
    Certified = 1
    ODE = 2
    QNF = 3
    CRD = 4

    def __str__(self):
        return self.name

    def __contains__(self, e):
        return e in self.__members__


@enum.unique
class Product(enum.Enum):
    GeForce = (107, 879)
    GeForceMobile = (111, 890)
    Quadro = (73, 844)
    QuadroMobile = (74, 875)
    Tesla = (110, 883)

    def __str__(self):
        return self.name

    def __contains__(self, e):
        return e in self.__members__


@enum.unique
class DriverType(enum.Enum):
    Standard = 0
    DCH = 1

    def __str__(self):
        return self.name

    def __contains__(self, e):
        return e in self.__members__


@enum.unique
class DriverLanguage(enum.Enum):
    English = 1

    def __str__(self):
        return self.name

    def __contains__(self, e):
        return e in self.__members__


@enum.unique
class CUDAToolkitVersion(enum.Enum):
    Nothing = 0
    v10_0 = 20
    v10_1 = 21

    def __str__(self):
        return self.name

    def __contains__(self, e):
        return e in self.__members__


def parse_args():
    import argparse

    def check_positive_float(val):
        val = float(val)
        if val <= 0:
            raise ValueError("Value %s is not valid positive float" %
                             (repr(val),))
        return val

    parser = argparse.ArgumentParser(
        description="Retrieves info about latest NVIDIA drivers from "
        "downloads site",
        formatter_class=argparse.ArgumentDefaultsHelpFormatter)
    parser.add_argument("-o", "--os",
                        type=OS.__getitem__,
                        choices=list(OS),
                        default=OS.Linux_64,
                        help="OS")
    parser.add_argument("-p", "--product",
                        type=Product.__getitem__,
                        choices=list(Product),
                        default=Product.GeForce,
                        help="GPU Product type")
    parser.add_argument("-c", "--certification-level",
                        type=CertLevel.__getitem__,
                        choices=list(CertLevel),
                        default=CertLevel.All,
                        help="driver certification level")
    parser.add_argument("-D", "--dch",
                        help="Query DCH driver instead of Standard driver",
                        default=DriverType.Standard,
                        const=DriverType.DCH,
                        action="store_const")
    parser.add_argument("-T", "--timeout",
                        type=check_positive_float,
                        default=10.,
                        help="timeout for network operations")
    args = parser.parse_args()
    return args


def fetch_url(url, timeout=10):
    http_req = urllib.request.Request(
        url,
        data=None,
        headers={
            'User-Agent': USER_AGENT
        }
    )
    with urllib.request.urlopen(http_req, None, timeout) as resp:
        coding = resp.headers.get_content_charset()
        coding = coding if coding is not None else 'utf-8-sig'
        decoder = codecs.getreader(coding)(resp)
        res = decoder.read()
    return res


def issue_request(query_obj, timeout=10):
    ENDPOINT = 'https://www.nvidia.com/Download/processFind.aspx'
    url = ENDPOINT + '?' + urllib.parse.urlencode(query_obj)
    return fetch_url(url, timeout)


def parse_download_page(url):
    try:
        body = fetch_url(url)
        soup = BeautifulSoup(body, 'html.parser')
    except Exception as exc:
        print('parse_download_page error: %s' % (str(exc),), file=sys.stderr)
        return None
    download_div = soup.find('div', id='dnldBttns')
    if download_div is None:
        download_div = soup.find('div', id='mainContent')
    if download_div is None:
        print('parse_download_page error: download div not found', file=sys.stderr)
        return None
    download_anchor = download_div.find('a', attrs={'href': DOWNLOAD_URL_RE})
    if download_anchor is not None:
        return {
            'download_url': download_anchor['href']
        }
    return None


def parse_product_page(url):
    try:
        body = fetch_url(url)
        soup = BeautifulSoup(body, 'html.parser')
    except Exception as exc:
        print('parse_product_page error: %s' % (str(exc),), file=sys.stderr)
        return None
    download_anchor = soup.find('a', attrs={'href': True}, id='lnkDwnldBtn')
    if download_anchor is None:
        return None
    download_page_url = download_anchor['href']
    return parse_download_page(urllib.parse.urljoin(url, download_page_url))


def get_drivers(*,
                os=OS.Linux_64,
                product=Product.GeForce,
                certlevel=CertLevel.All,
                driver_type=DriverType.Standard,
                lang=DriverLanguage.English,
                cuda_ver=CUDAToolkitVersion.Nothing,
                timeout=10):
    psid, pfid = product.value
    query = {
        'psid': psid,
        'pfid': pfid,
        'osid': os.value,
        'lid': lang.value,
        'whql': certlevel.value,
        'lang': 'en-us',
        'ctk': cuda_ver.value,
    }
    if os is OS.Windows10_64:
        query['dtcid'] = driver_type.value
    doc = issue_request(query, timeout)
    soup = BeautifulSoup(doc, 'html.parser')
    if soup.find(class_='contentBucketMainContent') is None:
        return []
    driverlistrows = list(
        soup.find(class_='contentBucketMainContent')
            .find_all('tr', id='driverList'))
    if not driverlistrows:
        return []
    header = soup.find('td', class_='gridHeader').parent

    def normalize_header(td):
        return td.string.replace(' ', '').lower()

    label_tuple = tuple(normalize_header(td) for td in header('td'))

    def parse_content_td(td):
        s = list(td.strings)
        return max(s, key=len).strip() if s else ''

    def parse_version(row):
        return tuple(parse_content_td(row['version']).split('.'))

    def normalize_product_url(url):
        res = urllib.parse.urlparse(url, scheme='https', allow_fragments=False)
        return urllib.parse.urlunparse(res)

    labeled_rows = [dict(zip(label_tuple, tr('td'))) for tr in driverlistrows]
    latest_driver_row = max(labeled_rows, key=parse_version)
    obj = dict((k, parse_content_td(v)) for k, v in latest_driver_row.items())
    product_td = latest_driver_row['name']
    product_anchor = product_td.find('a', attrs={"href": True})
    if product_anchor is not None:
        product_page = normalize_product_url(product_anchor['href'])
        obj['product_page'] = product_page
        pp_parse_res = parse_product_page(product_page)
        if pp_parse_res is not None:
            obj.update(pp_parse_res)
    return obj


def main():
    import pprint
    args = parse_args()
    pprint.pprint(get_drivers(os=args.os,
                              product=args.product,
                              certlevel=args.certification_level,
                              driver_type=args.dch,
                              timeout=args.timeout))


if __name__ == '__main__':
    main()
nv-driver-locator: implemented new NvidiaDownloadsChannel "plugin" 2019-02-10 18:22:52 +00:00			`#!/usr/bin/env python3`

ndl: gnd: add download url 2019-08-22 12:26:36 +00:00			`import sys`
nv-driver-locator: implemented new NvidiaDownloadsChannel "plugin" 2019-02-10 18:22:52 +00:00			`import urllib.request`
			`import urllib.error`
			`import urllib.parse`
			`import codecs`
			`import enum`
ndl: gnd: add download url 2019-08-22 12:26:36 +00:00			`import re`
nv-driver-locator: implemented new NvidiaDownloadsChannel "plugin" 2019-02-10 18:22:52 +00:00			`from bs4 import BeautifulSoup`

			`USER_AGENT = 'Mozilla/5.0 (X11; Linux x86_64; rv:65.0) '\`
			`'Gecko/20100101 Firefox/65.0'`
ndl: gnd: add download url 2019-08-22 12:26:36 +00:00			`DOWNLOAD_URL_RE = re.compile('.download\.nvidia\.com.', re.A \| re.I)`
nv-driver-locator: implemented new NvidiaDownloadsChannel "plugin" 2019-02-10 18:22:52 +00:00

			`@enum.unique`
			`class OS(enum.Enum):`
			`Linux_32 = 11`
			`Linux_64 = 12`
			`Windows7_32 = 18`
			`Windows7_64 = 19`
			`Windows10_32 = 56`
			`Windows10_64 = 57`
nv-driver-locator: add support for Windows Server drivers 2019-05-19 20:34:11 +00:00			`WindowsServer2012R2_32 = 32`
			`WindowsServer2012R2_64 = 44`
ndl: add WS{2016,2019} 2019-06-09 18:45:31 +00:00			`WindowsServer2016 = 74`
			`WindowsServer2019 = 119`
nv-driver-locator: implemented new NvidiaDownloadsChannel "plugin" 2019-02-10 18:22:52 +00:00
			`def __str__(self):`
			`return self.name`

			`def __contains__(self, e):`
			`return e in self.__members__`


			`@enum.unique`
			`class CertLevel(enum.Enum):`
			`All = ''`
			`Beta = 0`
			`Certified = 1`
			`ODE = 2`
			`QNF = 3`
nv-driver-locator: support for creator ready driver 2019-04-02 22:51:01 +00:00			`CRD = 4`
nv-driver-locator: implemented new NvidiaDownloadsChannel "plugin" 2019-02-10 18:22:52 +00:00
			`def __str__(self):`
			`return self.name`

			`def __contains__(self, e):`
			`return e in self.__members__`


			`@enum.unique`
			`class Product(enum.Enum):`
			`GeForce = (107, 879)`
			`GeForceMobile = (111, 890)`
			`Quadro = (73, 844)`
			`QuadroMobile = (74, 875)`
ndl: track tesla drivers as well 2019-10-12 08:32:00 +00:00			`Tesla = (110, 883)`
nv-driver-locator: implemented new NvidiaDownloadsChannel "plugin" 2019-02-10 18:22:52 +00:00
			`def __str__(self):`
			`return self.name`

			`def __contains__(self, e):`
			`return e in self.__members__`


			`@enum.unique`
			`class DriverType(enum.Enum):`
			`Standard = 0`
			`DCH = 1`

			`def __str__(self):`
			`return self.name`

			`def __contains__(self, e):`
			`return e in self.__members__`


			`@enum.unique`
			`class DriverLanguage(enum.Enum):`
			`English = 1`

			`def __str__(self):`
			`return self.name`

			`def __contains__(self, e):`
			`return e in self.__members__`


			`@enum.unique`
			`class CUDAToolkitVersion(enum.Enum):`
			`Nothing = 0`
			`v10_0 = 20`
ndl: track tesla drivers as well 2019-10-12 08:32:00 +00:00			`v10_1 = 21`
nv-driver-locator: implemented new NvidiaDownloadsChannel "plugin" 2019-02-10 18:22:52 +00:00
			`def __str__(self):`
			`return self.name`

			`def __contains__(self, e):`
			`return e in self.__members__`


			`def parse_args():`
			`import argparse`

nv-driver-locator: timeouts 2019-02-11 18:01:20 +00:00			`def check_positive_float(val):`
			`val = float(val)`
			`if val <= 0:`
			`raise ValueError("Value %s is not valid positive float" %`
			`(repr(val),))`
			`return val`

nv-driver-locator: implemented new NvidiaDownloadsChannel "plugin" 2019-02-10 18:22:52 +00:00			`parser = argparse.ArgumentParser(`
			`description="Retrieves info about latest NVIDIA drivers from "`
			`"downloads site",`
			`formatter_class=argparse.ArgumentDefaultsHelpFormatter)`
			`parser.add_argument("-o", "--os",`
			`type=OS.__getitem__,`
			`choices=list(OS),`
			`default=OS.Linux_64,`
			`help="OS")`
			`parser.add_argument("-p", "--product",`
			`type=Product.__getitem__,`
			`choices=list(Product),`
			`default=Product.GeForce,`
			`help="GPU Product type")`
			`parser.add_argument("-c", "--certification-level",`
			`type=CertLevel.__getitem__,`
			`choices=list(CertLevel),`
			`default=CertLevel.All,`
			`help="driver certification level")`
			`parser.add_argument("-D", "--dch",`
			`help="Query DCH driver instead of Standard driver",`
			`default=DriverType.Standard,`
			`const=DriverType.DCH,`
			`action="store_const")`
nv-driver-locator: timeouts 2019-02-11 18:01:20 +00:00			`parser.add_argument("-T", "--timeout",`
			`type=check_positive_float,`
			`default=10.,`
			`help="timeout for network operations")`
nv-driver-locator: implemented new NvidiaDownloadsChannel "plugin" 2019-02-10 18:22:52 +00:00			`args = parser.parse_args()`
			`return args`


ndl: gnd: add download url 2019-08-22 12:26:36 +00:00			`def fetch_url(url, timeout=10):`
nv-driver-locator: implemented new NvidiaDownloadsChannel "plugin" 2019-02-10 18:22:52 +00:00			`http_req = urllib.request.Request(`
			`url,`
			`data=None,`
			`headers={`
			`'User-Agent': USER_AGENT`
			`}`
			`)`
nv-driver-locator: timeouts 2019-02-11 18:01:20 +00:00			`with urllib.request.urlopen(http_req, None, timeout) as resp:`
nv-driver-locator: implemented new NvidiaDownloadsChannel "plugin" 2019-02-10 18:22:52 +00:00			`coding = resp.headers.get_content_charset()`
			`coding = coding if coding is not None else 'utf-8-sig'`
			`decoder = codecs.getreader(coding)(resp)`
			`res = decoder.read()`
			`return res`


ndl: gnd: add download url 2019-08-22 12:26:36 +00:00			`def issue_request(query_obj, timeout=10):`
			`ENDPOINT = 'https://www.nvidia.com/Download/processFind.aspx'`
			`url = ENDPOINT + '?' + urllib.parse.urlencode(query_obj)`
			`return fetch_url(url, timeout)`


			`def parse_download_page(url):`
			`try:`
			`body = fetch_url(url)`
			`soup = BeautifulSoup(body, 'html.parser')`
			`except Exception as exc:`
			`print('parse_download_page error: %s' % (str(exc),), file=sys.stderr)`
			`return None`
			`download_div = soup.find('div', id='dnldBttns')`
			`if download_div is None:`
			`download_div = soup.find('div', id='mainContent')`
			`if download_div is None:`
			`print('parse_download_page error: download div not found', file=sys.stderr)`
			`return None`
			`download_anchor = download_div.find('a', attrs={'href': DOWNLOAD_URL_RE})`
			`if download_anchor is not None:`
			`return {`
			`'download_url': download_anchor['href']`
			`}`
			`return None`


			`def parse_product_page(url):`
			`try:`
			`body = fetch_url(url)`
			`soup = BeautifulSoup(body, 'html.parser')`
			`except Exception as exc:`
			`print('parse_product_page error: %s' % (str(exc),), file=sys.stderr)`
			`return None`
			`download_anchor = soup.find('a', attrs={'href': True}, id='lnkDwnldBtn')`
			`if download_anchor is None:`
			`return None`
			`download_page_url = download_anchor['href']`
			`return parse_download_page(urllib.parse.urljoin(url, download_page_url))`


nv-driver-locator: implemented new NvidiaDownloadsChannel "plugin" 2019-02-10 18:22:52 +00:00			`def get_drivers(*,`
			`os=OS.Linux_64,`
			`product=Product.GeForce,`
			`certlevel=CertLevel.All,`
			`driver_type=DriverType.Standard,`
			`lang=DriverLanguage.English,`
nv-driver-locator: timeouts 2019-02-11 18:01:20 +00:00			`cuda_ver=CUDAToolkitVersion.Nothing,`
			`timeout=10):`
nv-driver-locator: implemented new NvidiaDownloadsChannel "plugin" 2019-02-10 18:22:52 +00:00			`psid, pfid = product.value`
			`query = {`
			`'psid': psid,`
			`'pfid': pfid,`
			`'osid': os.value,`
			`'lid': lang.value,`
			`'whql': certlevel.value,`
			`'lang': 'en-us',`
			`'ctk': cuda_ver.value,`
			`}`
			`if os is OS.Windows10_64:`
			`query['dtcid'] = driver_type.value`
nv-driver-locator: timeouts 2019-02-11 18:01:20 +00:00			`doc = issue_request(query, timeout)`
nv-driver-locator: implemented new NvidiaDownloadsChannel "plugin" 2019-02-10 18:22:52 +00:00			`soup = BeautifulSoup(doc, 'html.parser')`
			`if soup.find(class_='contentBucketMainContent') is None:`
			`return []`
			`driverlistrows = list(`
			`soup.find(class_='contentBucketMainContent')`
			`.find_all('tr', id='driverList'))`
			`if not driverlistrows:`
			`return []`
			`header = soup.find('td', class_='gridHeader').parent`

			`def normalize_header(td):`
			`return td.string.replace(' ', '').lower()`

			`label_tuple = tuple(normalize_header(td) for td in header('td'))`

			`def parse_content_td(td):`
			`s = list(td.strings)`
			`return max(s, key=len).strip() if s else ''`

ndl: gnd: add download url 2019-08-22 12:26:36 +00:00			`def parse_version(row):`
			`return tuple(parse_content_td(row['version']).split('.'))`

			`def normalize_product_url(url):`
			`res = urllib.parse.urlparse(url, scheme='https', allow_fragments=False)`
			`return urllib.parse.urlunparse(res)`

			`labeled_rows = [dict(zip(label_tuple, tr('td'))) for tr in driverlistrows]`
			`latest_driver_row = max(labeled_rows, key=parse_version)`
			`obj = dict((k, parse_content_td(v)) for k, v in latest_driver_row.items())`
			`product_td = latest_driver_row['name']`
			`product_anchor = product_td.find('a', attrs={"href": True})`
			`if product_anchor is not None:`
			`product_page = normalize_product_url(product_anchor['href'])`
			`obj['product_page'] = product_page`
			`pp_parse_res = parse_product_page(product_page)`
			`if pp_parse_res is not None:`
			`obj.update(pp_parse_res)`
			`return obj`
nv-driver-locator: implemented new NvidiaDownloadsChannel "plugin" 2019-02-10 18:22:52 +00:00

			`def main():`
			`import pprint`
			`args = parse_args()`
			`pprint.pprint(get_drivers(os=args.os,`
			`product=args.product,`
			`certlevel=args.certification_level,`
nv-driver-locator: timeouts 2019-02-11 18:01:20 +00:00			`driver_type=args.dch,`
			`timeout=args.timeout))`
nv-driver-locator: implemented new NvidiaDownloadsChannel "plugin" 2019-02-10 18:22:52 +00:00

			`if __name__ == '__main__':`
			`main()`