Completed
Push — master ( f346bf...683ddf )
by John
03:21
created

ptcrb_scraper()   B

Complexity

Conditions 4

Size

Total Lines 23

Duplication

Lines 0
Ratio 0 %

Code Coverage

Tests 15
CRAP Score 4

Importance

Changes 2
Bugs 1 Features 1
Metric Value
cc 4
c 2
b 1
f 1
dl 0
loc 23
ccs 15
cts 15
cp 1
crap 4
rs 8.7972
1
#!/usr/bin/env python3
2 5
"""This module is used for network connections; APIs, downloading, etc."""
3
4 5
import os  # filesystem read
5 5
try:
6 5
    from defusedxml import ElementTree  # safer XML parsing
7
except (ImportError, AttributeError):
8
    from xml.etree import ElementTree  # XML parsing
9 5
import re  # regexes
10 5
import concurrent.futures  # multiprocessing/threading
11 5
import glob  # pem file lookup
12 5
import requests  # downloading
13 5
from bs4 import BeautifulSoup  # scraping
14 5
from bbarchivist import utilities  # parse filesize
15 5
from bbarchivist.bbconstants import SERVERS  # lookup servers
16
17 5
__author__ = "Thurask"
18 5
__license__ = "WTFPL v2"
19 5
__copyright__ = "2015-2017 Thurask"
20
21
22 5
def grab_pem():
    """
    Locate the CA bundle to use for HTTPS requests.

    A ``cacert.pem`` in the current working directory takes priority;
    otherwise the bundle path reported by requests is returned.
    """
    local_bundles = glob.glob(os.path.join(os.getcwd(), "cacert.pem"))
    if local_bundles:
        return os.path.abspath(local_bundles[0])  # local cacerts
    return requests.certs.where()  # no local cacerts
32
33
34 5
def pem_wrapper(method):
    """
    Decorator to set REQUESTS_CA_BUNDLE.

    The wrapped function keeps its own name and docstring.

    :param method: Method to use.
    :type method: function
    """
    import functools  # local import: only this decorator needs it

    @functools.wraps(method)
    def wrapper(*args, **kwargs):
        # Set REQUESTS_CA_BUNDLE before every call, so a cacert.pem that
        # appears in the working directory later is still picked up.
        os.environ["REQUESTS_CA_BUNDLE"] = grab_pem()
        return method(*args, **kwargs)
    return wrapper
48
49
50 5
def generic_soup_parser(url, session=None):
    """
    Fetch a URL and return its body parsed by BeautifulSoup's "html.parser".

    :param url: The URL to check.
    :type url: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    if session is None:
        session = requests.Session()
    response = session.get(url)
    return BeautifulSoup(response.content, "html.parser")
64
65
66 5
@pem_wrapper
def get_length(url, session=None):
    """
    Get content-length header from some URL.

    Returns 0 when the URL is None, the connection fails, or the header
    is missing or not an integer.

    :param url: The URL to check.
    :type url: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    if url is None:  # nothing to query, so don't bother building a session
        return 0
    session = requests.Session() if session is None else session
    try:
        heads = session.head(url)
    except requests.ConnectionError:
        return 0
    try:
        # Not every HEAD response carries a content-length header.
        return int(heads.headers.get('content-length', 0))
    except (TypeError, ValueError):
        return 0
86
87
88 5
@pem_wrapper
def download(url, output_directory=None, session=None):
    """
    Download the file at a URL into a folder, discarding empty results.

    The local filename is the last path component of the URL.

    :param url: URL to download from.
    :type url: str

    :param output_directory: Download folder. Default is local.
    :type output_directory: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    if session is None:
        session = requests.Session()
    if output_directory is None:
        output_directory = os.getcwd()
    filename = url.rsplit('/', 1)[-1]
    shortname = utilities.stripper(filename)
    target = os.path.join(output_directory, filename)
    download_writer(url, target, filename, shortname, session)
    remove_empty_download(target)
109
110
111 5
def remove_empty_download(fname):
    """
    Delete a file when it contains zero bytes.

    :param fname: File path.
    :type fname: str
    """
    size = os.stat(fname).st_size
    if size != 0:
        return
    os.remove(fname)
120
121
122 5
def download_writer(url, fname, lfname, sname, session=None):
    """
    Download file and write to disk.

    The output file is created before the request is made, so a failed
    download leaves an empty file behind for the caller to clean up.

    :param url: URL to download from.
    :type url: str

    :param fname: File path.
    :type fname: str

    :param lfname: Long filename.
    :type lfname: str

    :param sname: Short name, for printing to screen.
    :type sname: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    session = requests.Session() if session is None else session
    with open(fname, "wb") as file:
        req = session.get(url, stream=True)
        try:
            if req.status_code == 200:  # 200 OK
                # The size is only for display; the header may be absent.
                clength = req.headers.get('content-length')
                fsize = utilities.fsizer(clength) if clength is not None else "unknown size"
                print("DOWNLOADING {0} [{1}]".format(sname, fsize))
                for chunk in req.iter_content(chunk_size=1024):
                    file.write(chunk)
            else:
                print("ERROR: HTTP {0} IN {1}".format(req.status_code, lfname))
        finally:
            req.close()  # release the streamed connection
151
152
153 5
def download_bootstrap(urls, outdir=None, workers=5, session=None):
    """
    Run downloaders for each file in given URL iterable.

    :param urls: URLs to download.
    :type urls: list

    :param outdir: Download folder. Default is handled in :func:`download`.
    :type outdir: str

    :param workers: Maximum number of worker threads. Default is 5.
    :type workers: int

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    # Never more workers than URLs, but at least one: ThreadPoolExecutor
    # raises ValueError for max_workers <= 0 (e.g. an empty URL list).
    workers = max(1, min(len(urls), workers))
    spinman = utilities.SpinManager()
    with concurrent.futures.ThreadPoolExecutor(max_workers=workers) as xec:
        try:
            spinman.start()
            for url in urls:
                xec.submit(download, url, outdir, session)
        except (KeyboardInterrupt, SystemExit):
            xec.shutdown()
            spinman.stop()
    # Leaving the with-block waits for all submitted downloads to finish.
    spinman.stop()
    utilities.spinner_clear()
    utilities.line_begin()
182
183
184 5
@pem_wrapper
def availability(url, session=None):
    """
    Report whether a HEAD request to the URL gives an acceptable status.

    200 or 301-308 is OK, anything else (or a connection error) is not.

    :param url: URL to check.
    :type url: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    if session is None:
        session = requests.Session()
    try:
        response = session.head(url)
    except requests.ConnectionError:
        return False
    code = int(response.status_code)
    if code == 200:
        return True
    return 300 < code <= 308
203
204
205 5
def clean_availability(results, server):
    """
    Pick one server's lookup result and a marker for the autolookup script.

    Returns ``(release, marker)``; the marker is two spaces when the release
    is None or "SR not in system".

    :param results: Result dict.
    :type results: dict(str: str)

    :param server: Server, key for result dict.
    :type server: str
    """
    if server == "p":
        marker = "PD"
    else:
        marker = server.upper()
    rel = results[server.lower()]
    if rel is None or rel == "SR not in system":
        avail = "  "
    else:
        avail = marker
    return rel, avail
219
220
221 5
@pem_wrapper
def carrier_checker(mcc, mnc, session=None):
    """
    Query BlackBerry World to map a MCC and a MNC to a country and carrier.

    Returns ``(country, carrier)``; either value is None when the response
    has no matching element.

    :param mcc: Country code.
    :type mcc: int

    :param mnc: Network code.
    :type mnc: int

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    session = requests.Session() if session is None else session
    url = "http://appworld.blackberry.com/ClientAPI/checkcarrier?homemcc={0}&homemnc={1}&devicevendorid=-1&pin=0".format(
        mcc, mnc)
    user_agent = {'User-agent': 'AppWorld/5.1.0.60'}
    req = session.get(url, headers=user_agent)
    root = ElementTree.fromstring(req.text)
    # Pre-bind both names so a response lacking either tag cannot raise
    # UnboundLocalError at the return statement.
    country = carrier = None
    for child in root:
        if child.tag == "country":
            country = child.get("name")
        elif child.tag == "carrier":
            carrier = child.get("name")
    return country, carrier
247
248
249 5
def return_npc(mcc, mnc):
    """
    Build a NPC string: zero-padded MCC, zero-padded MNC, then "30".

    :param mcc: Country code.
    :type mcc: int

    :param mnc: Network code.
    :type mnc: int
    """
    padded_mcc = str(mcc).zfill(3)
    padded_mnc = str(mnc).zfill(3)
    return "{0}{1}30".format(padded_mcc, padded_mnc)
260
261
262 5
@pem_wrapper
def carrier_query(npc, device, upgrade=False, blitz=False, forced=None, session=None):
    """
    Ask BlackBerry's update server which update is out for a carrier.

    Posts an updateDetailRequest document and hands the response text to
    :func:`parse_carrier_xml`.

    :param npc: MCC + MNC (see `func:return_npc`)
    :type npc: int

    :param device: Hexadecimal hardware ID.
    :type device: str

    :param upgrade: Whether to use upgrade files. False by default.
    :type upgrade: bool

    :param blitz: Whether or not to create a blitz package. False by default.
    :type blitz: bool

    :param forced: Force a software release.
    :type forced: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    if session is None:
        session = requests.Session()
    mode = "upgrade" if upgrade else "repair"
    release = "latest" if forced is None else forced
    endpoint = "https://cs.sl.blackberry.com/cse/updateDetails/2.2/"
    fragments = [
        '<?xml version="1.0" encoding="UTF-8"?>',
        '<updateDetailRequest version="2.2.1" authEchoTS="1366644680359">',
        "<clientProperties>",
        "<hardware>",
        "<pin>0x2FFFFFB3</pin><bsn>1128121361</bsn>",
        "<imei>004401139269240</imei>",
        "<id>0x{0}</id>".format(device),
        "</hardware>",
        "<network>",
        "<homeNPC>0x{0}</homeNPC>".format(npc),
        "<iccid>89014104255505565333</iccid>",
        "</network>",
        "<software>",
        "<currentLocale>en_US</currentLocale>",
        "<legalLocale>en_US</legalLocale>",
        "</software>",
        "</clientProperties>",
        "<updateDirectives>",
        '<allowPatching type="REDBEND">true</allowPatching>',
        "<upgradeMode>{0}</upgradeMode>".format(mode),
        "<provideDescriptions>false</provideDescriptions>",
        "<provideFiles>true</provideFiles>",
        "<queryType>NOTIFICATION_CHECK</queryType>",
        "</updateDirectives>",
        "<pollType>manual</pollType>",
        "<resultPackageSetCriteria>",
        '<softwareRelease softwareReleaseVersion="{0}" />'.format(release),
        "<releaseIndependent>",
        '<packageType operation="include">application</packageType>',
        "</releaseIndependent>",
        "</resultPackageSetCriteria>",
        "</updateDetailRequest>",
    ]
    payload = "".join(fragments)
    content_type = {"Content-Type": "text/xml;charset=UTF-8"}
    response = session.post(endpoint, headers=content_type, data=payload)
    return parse_carrier_xml(response.text, blitz)
324
325
326 5
def carrier_swver_get(root):
    """
    Get software release from carrier XML.

    Returns the ``softwareReleaseVersion`` attribute of the last
    ``softwareReleaseMetadata`` element found, or None if there is none.

    :param root: ElementTree we're barking up.
    :type root: xml.etree.ElementTree.ElementTree
    """
    swver = None  # pre-bound so an empty search cannot raise UnboundLocalError
    for child in root.iter("softwareReleaseMetadata"):
        swver = child.get("softwareReleaseVersion")
    return swver
336
337
338 5
def carrier_child_fileappend(child, files, baseurl, blitz=False):
    """
    Add a package element's bar file link to the file list.

    In blitz mode, radio, desktop and OS packages are left out. The list
    is modified in place and also returned.

    :param child: Child element in use.
    :type child: xml.etree.ElementTree.Element

    :param files: Filelist.
    :type files: list(str)

    :param baseurl: Base URL, URL minus the filename.
    :type baseurl: str

    :param blitz: Whether or not to create a blitz package. False by default.
    :type blitz: bool
    """
    system_types = ["system:radio", "system:desktop", "system:os"]
    if blitz and child.get("type") in system_types:
        return files
    files.append(baseurl + child.get("path"))
    return files
360
361
362 5
def carrier_child_finder(root, files, baseurl, blitz=False):
    """
    Walk every package element, collecting file links and versions.

    Returns ``(osver, radver, files)``; a version stays "" when no package
    of that type is present.

    :param root: ElementTree we're barking up.
    :type root: xml.etree.ElementTree.ElementTree

    :param files: Filelist.
    :type files: list(str)

    :param baseurl: Base URL, URL minus the filename.
    :type baseurl: str

    :param blitz: Whether or not to create a blitz package. False by default.
    :type blitz: bool
    """
    osver = ""
    radver = ""
    for package in root.iter("package"):
        files = carrier_child_fileappend(package, files, baseurl, blitz)
        kind = package.get("type")
        if kind == "system:radio":
            radver = package.get("version")
        elif kind in ("system:desktop", "system:os"):
            osver = package.get("version")
    return osver, radver, files
388
389
390 5
def parse_carrier_xml(data, blitz=False):
    """
    Pull the interesting fields out of a carrier update response.

    Returns ``(swver, osver, radver, files)``. ``swver`` is "N/A" when the
    response has no software release metadata; the versions are "" and the
    file list is empty when it has no file set.

    :param data: The data to parse.
    :type data: xml

    :param blitz: Whether or not to create a blitz package. False by default.
    :type blitz: bool
    """
    root = ElementTree.fromstring(data)
    if root.find('./data/content/softwareReleaseMetadata') is None:
        swver = "N/A"
    else:
        swver = carrier_swver_get(root)
    files = []
    osver = ""
    radver = ""
    fileset = root.find('./data/content/fileSets/fileSet')
    if fileset is not None:
        baseurl = "{0}/".format(fileset.get("url"))
        osver, radver, files = carrier_child_finder(root, files, baseurl, blitz)
    return (swver, osver, radver, files)
412
413
414 5
@pem_wrapper
def sr_lookup(osver, server, session=None):
    """
    Software release lookup, with choice of server.
    :data:`bbarchivist.bbconstants.SERVERS` for server list.

    Returns the software release string, or "SR not in system" on a
    timeout, connection error, unparseable response, or no usable result.

    :param osver: OS version to lookup, 10.x.y.zzzz.
    :type osver: str

    :param server: Server to use.
    :type server: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    session = requests.Session() if session is None else session
    reg = re.compile(r"(\d{1,4}\.)(\d{1,4}\.)(\d{1,4}\.)(\d{1,4})")
    query = '<?xml version="1.0" encoding="UTF-8"?>'
    query += '<srVersionLookupRequest version="2.0.0"'
    query += ' authEchoTS="1366644680359">'
    query += '<clientProperties><hardware>'
    query += '<pin>0x2FFFFFB3</pin><bsn>1140011878</bsn>'
    query += '<imei>004402242176786</imei><id>0x8D00240A</id>'
    query += '<isBootROMSecure>true</isBootROMSecure>'
    query += '</hardware>'
    query += '<network>'
    query += '<vendorId>0x0</vendorId><homeNPC>0x60</homeNPC>'
    query += '<currentNPC>0x60</currentNPC><ecid>0x1</ecid>'
    query += '</network>'
    query += '<software><currentLocale>en_US</currentLocale>'
    query += '<legalLocale>en_US</legalLocale>'
    query += '<osVersion>{0}</osVersion>'.format(osver)
    query += '<omadmEnabled>false</omadmEnabled>'
    query += '</software></clientProperties>'
    query += '</srVersionLookupRequest>'
    header = {"Content-Type": "text/xml;charset=UTF-8"}
    try:
        req = session.post(server, headers=header, data=query, timeout=1)
    except (requests.exceptions.Timeout, requests.exceptions.ConnectionError):
        return "SR not in system"
    try:
        root = ElementTree.fromstring(req.text)
    except ElementTree.ParseError:
        return "SR not in system"
    packages = root.findall('./data/content/')
    for package in packages:
        if package.text is not None:
            # The first element carrying text decides the outcome.
            if reg.match(package.text):
                return package.text
            return "SR not in system"
    # No element had text: report it like every other failure path
    # instead of falling through with an implicit None.
    return "SR not in system"
467
468
469 5
def sr_lookup_bootstrap(osv, session=None, no2=False):
    """
    Run lookups for each server for given OS.

    Returns a dict mapping server key ("p", "a1", "a2", "b1", "b2") to the
    lookup result, or None if interrupted from the keyboard.

    :param osv: OS to check.
    :type osv: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()

    :param no2: Whether to skip Alpha2/Beta2 servers. Default is false.
    :type no2: bool
    """
    keys = ["p", "a1", "a2", "b1", "b2"]
    if no2:
        keys = [key for key in keys if key not in ("a2", "b2")]
    with concurrent.futures.ThreadPoolExecutor(max_workers=5) as xec:
        try:
            # Submit every lookup before waiting on any of them; calling
            # .result() right after .submit() would run them one at a time.
            futures = [(key, xec.submit(sr_lookup, osv, SERVERS[key], session)) for key in keys]
            results = {}
            for key, future in futures:
                results[key] = future.result()
            return results
        except KeyboardInterrupt:
            xec.shutdown(wait=False)
            return None
499
500
501 5
@pem_wrapper
def available_bundle_lookup(mcc, mnc, device, session=None):
    """
    Check which software releases were ever released for a carrier.

    Returns the "version" attribute of each bundle in the response, or an
    empty list when the response has no ``data/content`` element.

    :param mcc: Country code.
    :type mcc: int

    :param mnc: Network code.
    :type mnc: int

    :param device: Hexadecimal hardware ID.
    :type device: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    session = requests.Session() if session is None else session
    server = "https://cs.sl.blackberry.com/cse/availableBundles/1.0.0/"
    npc = return_npc(mcc, mnc)
    query = '<?xml version="1.0" encoding="UTF-8"?>'
    query += '<availableBundlesRequest version="1.0.0" '
    query += 'authEchoTS="1366644680359">'
    query += '<deviceId><pin>0x2FFFFFB3</pin></deviceId>'
    query += '<clientProperties><hardware><id>0x{0}</id>'.format(device)
    query += '<isBootROMSecure>true</isBootROMSecure></hardware>'
    query += '<network><vendorId>0x0</vendorId><homeNPC>0x{0}</homeNPC>'.format(npc)
    query += '<currentNPC>0x{0}</currentNPC></network><software>'.format(npc)
    query += '<currentLocale>en_US</currentLocale>'
    query += '<legalLocale>en_US</legalLocale>'
    query += '<osVersion>10.0.0.0</osVersion>'
    query += '<radioVersion>10.0.0.0</radioVersion></software>'
    query += '</clientProperties><updateDirectives><bundleVersionFilter>'
    query += '</bundleVersionFilter></updateDirectives>'
    query += '</availableBundlesRequest>'
    header = {"Content-Type": "text/xml;charset=UTF-8"}
    req = session.post(server, headers=header, data=query)
    root = ElementTree.fromstring(req.text)
    package = root.find('./data/content')
    if package is None:  # find() returns None when the element is absent
        return []
    bundlelist = [child.attrib["version"] for child in package]
    return bundlelist
542
543
544 5
@pem_wrapper
def ptcrb_scraper(ptcrbid):
    """
    Scrape the PTCRB certification page for a device and clean the entries.

    Looks for "OS ..." entries first and falls back to build-style codes
    (three capitals plus three digits) when none are found.

    :param ptcrbid: Numerical ID from PTCRB (end of URL).
    :type ptcrbid: str
    """
    baseurl = "https://ptcrb.com/vendor/complete/view_complete_request_guest.cfm?modelid={0}".format(
        ptcrbid)
    sess = requests.Session()
    sess.headers.update({"Referer": "https://ptcrb.com/vendor/complete/complete_request.cfm"})
    page_text = generic_soup_parser(baseurl, sess).get_text().replace("\r\n", " ")
    candidates = re.findall("OS .+[^\\n]", page_text, re.IGNORECASE)
    if not candidates:  # Priv
        candidates = re.findall(r"[A-Z]{3}[0-9]{3}[\s]", page_text)
    # they should hire QC people...
    return [ptcrb_item_cleaner(entry) for entry in candidates if not entry.endswith("\r\n")]
567
568
569 5
def space_pad(instring, minlength):
    """
    Right-pad a string with spaces up to a minimum length.

    Strings already at or beyond the minimum are returned unchanged.

    :param instring: String to pad.
    :type instring: str

    :param minlength: Pad while len(instring) < minlength.
    :type minlength: int
    """
    missing = minlength - len(instring)
    if missing > 0:
        instring = instring + " " * missing
    return instring
582
583
584 5
def ptcrb_item_cleaner(item):
    """
    Cleanup poorly formatted PTCRB entries written by an intern.

    Normalizes an entry towards "OS: x Radio: y SW Release: z". A bare
    build code gets an "OS:" prefix. Entries with fewer than four tokens
    are handled without raising.

    :param item: The item to clean.
    :type item: str
    """
    item = item.replace("<td>", "")
    item = item.replace("</td>", "")
    item = item.replace("\n", "")
    item = item.replace(" (SR", ", SR")
    item = re.sub(r"\s?\((.*)$", "", item)
    item = re.sub(r"\sSV.*$", "", item)
    item = item.replace(")", "")
    item = item.replace(". ", ".")
    item = item.replace(";", "")
    item = item.replace("version", "Version")
    item = item.replace("Verison", "Version")
    if item.count("OS") > 1:
        # Keep only the text after the first "OS", dropping the rest.
        templist = item.split("OS")
        templist[0] = "OS"
        item = "".join([templist[0], templist[1]])
    item = item.replace("SR", "SW Release")
    item = item.replace(" Version:", ":")
    item = item.replace("Version ", " ")
    item = item.replace(":1", ": 1")
    item = item.replace(", ", " ")
    item = item.replace("Software", "SW")
    item = item.replace("  ", " ")
    item = item.replace("OS ", "OS: ")
    item = item.replace("Radio ", "Radio: ")
    item = item.replace("Release ", "Release: ")
    # Strip first, so trailing whitespace cannot create an empty token
    # that hides a bare build code from the single-token branch below.
    spaclist = item.strip().split(" ")
    if len(spaclist) > 1:
        spaclist[1] = space_pad(spaclist[1], 11)
        if len(spaclist) > 3:  # short entries have no radio version to pad
            spaclist[3] = space_pad(spaclist[3], 11)
    else:
        spaclist.insert(0, "OS:")
    item = " ".join(spaclist)
    item = item.strip()
    return item
625
626
627 5
@pem_wrapper
def kernel_scraper(utils=False):
    """
    List branch names found on BlackBerry's GitHub kernel repo pages.

    Walks branch listing pages 1 through 9, stopping early at the first
    page that shows a "no results" message.

    :param utils: Check android-utils repo instead of android-linux-kernel. Default is False.
    :type utils: bool
    """
    repo = "android-utils" if utils else "android-linux-kernel"
    branches = []
    sess = requests.Session()
    page = 1
    while page < 10:
        url = "https://github.com/blackberry/{0}/branches/all?page={1}".format(repo, page)
        soup = generic_soup_parser(url, sess)
        if soup.find("div", {"class": "no-results-message"}):
            break
        found = re.findall(r"msm[0-9]{4}\/[A-Z0-9]{6}", soup.get_text(), re.IGNORECASE)
        branches.extend(found)
        page += 1
    return branches
647
648
649 5
def root_generator(folder, build, variant="common"):
    """
    Build the per-device root paths for the SHAxxx hash lookup URLs.

    :param folder: Dictionary of variant: loader name pairs.
    :type folder: dict(str: str)

    :param build: Build to check, 3 letters + 3 numbers.
    :type build: str

    :param variant: Autoloader variant. Default is "common".
    :type variant: str
    """
    # Priv specific
    priv_root = "bbfoundation/hashfiles_priv/{0}".format(folder[variant])
    # DTEK50 specific
    if build[:3] == "AAF":
        dtek_root = "bbSupport/DTEK50"
    else:
        dtek_root = "bbfoundation/hashfiles_priv/dtek50"
    # DTEK60 still uses dtek50 folder, for some reason
    return {"Priv": priv_root, "DTEK50": dtek_root, "DTEK60": dtek_root}
671
672
673 5
def make_droid_skeleton(method, build, device, variant="common"):
    """
    Build one Android autoloader URL, or the URL of its hash file.

    :param method: None for regular OS links, "sha256/512" for SHA256 or 512 hash.
    :type method: str

    :param build: Build to check, 3 letters + 3 numbers.
    :type build: str

    :param device: Device to check.
    :type device: str

    :param variant: Autoloader variant. Default is "common".
    :type variant: str
    """
    folder = {"vzw-vzw": "verizon", "na-att": "att", "na-tmo": "tmo", "common": "default"}
    devices = {"Priv": "qc8992", "DTEK50": "qc8952_64_sfi", "DTEK60": "qc8996"}
    roots = root_generator(folder, build, variant)
    platform = devices[device]
    base = "bbry_{2}_autoloader_user-{0}-{1}".format(variant, build.upper(), platform)
    if method is not None:
        return "http://ca.blackberry.com/content/dam/{1}/{0}.{2}sum".format(base, roots[device], method.lower())
    return "https://bbapps.download.blackberry.com/Priv/{0}.zip".format(base)
698
699
700 5
def bulk_droid_skeletons(devs, build, method=None):
    """
    Build autoloader/hash URLs for every device and applicable variant.

    Only the Priv gets the carrier-specific variants; every other device
    gets "common" alone.

    :param devs: List of devices.
    :type devs: list(str)

    :param build: Build to check, 3 letters + 3 numbers.
    :type build: str

    :param method: None for regular OS links, "sha256/512" for SHA256 or 512 hash.
    :type method: str
    """
    carrier_variants = ("common", "vzw-vzw", "na-tmo", "na-att")  # device variants
    common_variants = ("common", )  # no Americans
    carrier_devices = ("Priv", )  # may this list never expand in the future
    return [
        make_droid_skeleton(method, build, dev, var)
        for dev in devs
        for var in (carrier_variants if dev in carrier_devices else common_variants)
    ]
723
724
725 5
def prepare_droid_list(device):
    """
    Wrap a single device in a list; pass an existing list through as-is.

    :param device: Device to check.
    :type device: str
    """
    return device if isinstance(device, list) else [device]
737
738
739 5
def droid_scanner(build, device, method=None, session=None):
    """
    Check for Android autoloaders on BlackBerry's site.

    Returns the list of candidate URLs that are available, in generation
    order, or None when none are.

    :param build: Build to check, 3 letters + 3 numbers.
    :type build: str

    :param device: Device to check.
    :type device: str

    :param method: None for regular OS links, "sha256/512" for SHA256 or 512 hash.
    :type method: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    devs = prepare_droid_list(device)
    skels = bulk_droid_skeletons(devs, build, method)
    if not skels:  # ThreadPoolExecutor rejects max_workers=0
        return None
    with concurrent.futures.ThreadPoolExecutor(max_workers=len(skels)) as xec:
        # Submit every check before collecting any result, so the checks
        # actually overlap rather than running one after another.
        pending = [(skel, xec.submit(availability, skel, session)) for skel in skels]
        results = [skel for skel, future in pending if future.result()]
    return results if results else None
764
765
766 5
def chunker(iterable, inc):
    """
    Split a sliceable sequence into consecutive slices of length inc.

    The last slice is shorter when the length is not a multiple of inc.

    :param iterable: Iterable to chunk.
    :type iterable: list

    :param inc: Increment; how big each chunk is.
    :type inc: int
    """
    chunks = []
    for start in range(0, len(iterable), inc):
        chunks.append(iterable[start:start + inc])
    return chunks
778
779
780 5
def unicode_filter(intext):
    """
    Drop en dashes (U+2013) and trim surrounding whitespace.

    :param intext: Text to filter.
    :type intext: str
    """
    without_dashes = "".join(intext.split("\u2013"))
    return without_dashes.strip()
788
789
790 5
def table_header_filter(ptag):
    """
    Decide whether a p tag is a relevant table header.

    A relevant tag has a ``b`` child and text mentioning "BlackBerry" but
    not "experts". When there is no ``b`` child, the falsy result of
    ``find`` is returned as-is.

    :param ptag: P tag.
    :type ptag: bs4.element.Tag
    """
    bold = ptag.find("b")
    if not bold:
        return bold
    if "BlackBerry" not in ptag.text:
        return False
    return "experts" not in ptag.text
799
800
801 5
def table_headers(pees):
    """
    Collect the text of every p tag accepted by :func:`table_header_filter`.

    :param pees: List of p tags.
    :type pees: list(bs4.element.Tag)
    """
    bolds = []
    for ptag in pees:
        if table_header_filter(ptag):
            bolds.append(ptag.text)
    return bolds
810
811
812 5
@pem_wrapper
def loader_page_scraper(session=None):
    """
    Fetch the Android autoloader page and print each table found on it.

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    url = "http://ca.blackberry.com/support/smartphones/Android-OS-Reload.html"
    if session is None:
        session = requests.Session()
    soup = generic_soup_parser(url, session)
    tables = soup.find_all("table")
    headers = table_headers(soup.find_all("p"))
    position = 0
    for table in tables:
        loader_page_chunker(position, table, headers)
        position += 1
827
828
829 5
def loader_page_chunker(idx, table, headers):
    """
    Print a loader page table: its header, then its cells four at a time.

    :param idx: Index of enumerating tables.
    :type idx: int

    :param table: HTML table tag.
    :type table: bs4.element.Tag

    :param headers: List of table headers.
    :type headers: list(str)
    """
    title = headers[idx]
    print("~~~{0}~~~".format(title))
    cells = table.find_all("td")
    for row in chunker(cells, 4):
        loader_page_printer(row)
    print(" ")
847
848
849 5
def loader_page_printer(chunk):
    """
    Print one table row: first cell, second cell, and the third cell's link.

    :param chunk: List of td tags.
    :type chunk: list(bs4.element.Tag)
    """
    name_cell, version_cell, link_cell = chunk[0], chunk[1], chunk[2]
    key = unicode_filter(name_cell.text)
    ver = unicode_filter(version_cell.text)
    anchor = link_cell.find("a")
    link = unicode_filter(anchor["href"])
    print("{0}\n    {1}: {2}".format(key, ver, link))
860
861
862 5
@pem_wrapper
def base_metadata(url, session=None):
    """
    Download a BBNDK metadata file and return its second column.

    The body is split into lines; for each non-empty line the second
    comma-separated field is decoded as UTF-8.

    :param url: URL to check.
    :type url: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    if session is None:
        session = requests.Session()
    response = session.get(url)
    metadata = []
    for line in response.content.split(b"\n"):
        if not line:
            continue
        fields = line.split(b",")
        metadata.append(fields[1].decode("utf-8"))
    return metadata
879
880
881 5
def ndk_metadata(session=None):
    """
    Get BBNDK target metadata.

    Only entries whose text starts with "10.0", "10.1" or "10.2" are kept.

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    prefixes = ("10.0", "10.1", "10.2")
    url = "http://downloads.blackberry.com/upr/developers/update/bbndk/metadata"
    targets = []
    for entry in base_metadata(url, session):
        if entry.startswith(prefixes):
            targets.append(entry)
    return targets
891
892
893 5
def sim_metadata(session=None):
    """
    Get BBNDK simulator metadata.

    Thin wrapper that passes the simulator metadata URL to ``base_metadata``.

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    url = "http://downloads.blackberry.com/upr/developers/update/bbndk/simulator/simulator_metadata"
    return base_metadata(url, session)
902
903
904 5
def runtime_metadata(session=None):
    """
    Get BBNDK runtime metadata.

    Thin wrapper that passes the runtime metadata URL to ``base_metadata``.

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    url = "http://downloads.blackberry.com/upr/developers/update/bbndk/runtime/runtime_metadata"
    return base_metadata(url, session)
913
914
915 5
def series_generator(osversion):
    """
    Generate series/branch name from OS version.

    The first three dot-separated components of the version are joined as
    ``BB<first>_<second>_<third>``; any further components are ignored.
    A version with fewer than three components raises IndexError.

    :param osversion: OS version.
    :type osversion: str
    """
    parts = osversion.split(".")
    return "BB{0}_{1}_{2}".format(parts[0], parts[1], parts[2])
924
925
926 5
@pem_wrapper
def devalpha_urls(osversion, skel, session=None):
    """
    Check individual Dev Alpha autoloader URLs.

    Builds the download URL from the skeleton and OS version and sends a
    HEAD request. Returns a ``(url, content-length)`` tuple when the status
    code is 200, and an empty tuple for any other status.

    :param osversion: OS version.
    :type osversion: str

    :param skel: Individual skeleton format to try.
    :type skel: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    if session is None:
        session = requests.Session()
    url = "http://downloads.blackberry.com/upr/developers/downloads/{0}{1}.exe".format(skel, osversion)
    response = session.head(url)
    if response.status_code != 200:
        return ()
    return (url, response.headers["content-length"])
948
949
950 5
def devalpha_urls_bootstrap(osversion, skeletons, session=None):
    """
    Get list of valid Dev Alpha autoloader URLs.

    Every skeleton has its ``<SERIES>`` placeholder (if present) replaced by
    the series name derived from the OS version, then all candidate URLs are
    checked on a pool of up to five worker threads. The caller's
    ``skeletons`` list is left untouched, so it can be reused for another
    OS version.

    Returns a dict mapping each valid URL to its content-length, in skeleton
    order. Returns None if the check is interrupted with Ctrl-C.

    :param osversion: OS version.
    :type osversion: str

    :param skeletons: List of skeleton formats to try.
    :type skeletons: list

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    # Build a fresh list instead of writing back into the caller's list;
    # the series name is only computed for skeletons that actually need it.
    skels = [
        skel.replace("<SERIES>", series_generator(osversion)) if "<SERIES>" in skel else skel
        for skel in skeletons
    ]
    with concurrent.futures.ThreadPoolExecutor(max_workers=5) as xec:
        futures = []
        try:
            # Queue every check before waiting on any result, so the
            # requests overlap instead of running one after another.
            for skel in skels:
                futures.append(xec.submit(devalpha_urls, osversion, skel, session))
            finals = {}
            for future in futures:  # gather in submission order
                final = future.result()
                if final:
                    finals[final[0]] = final[1]
            return finals
        except KeyboardInterrupt:
            # Drop checks that have not started yet, then stop the pool.
            for future in futures:
                future.cancel()
            xec.shutdown(wait=False)
            return None
977
978
979 5
def dev_dupe_dicter(finals):
    """
    Prepare dictionary to clean duplicate autoloaders.

    Inverts the input mapping: each distinct value becomes a key whose value
    is the set of all original keys that carried it.

    :param finals: Dict of URL:content-length pairs.
    :type finals: dict(str: str)
    """
    by_size = {}
    for url, size in finals.items():
        if size not in by_size:
            by_size[size] = set()
        by_size[size].add(url)
    return by_size
990
991
992 5
def dev_dupe_remover(finals, dupelist):
    """
    Filter dictionary of autoloader entries.

    Every URL in the duplicate groups that contains "DevAlpha" is deleted
    from ``finals``. The dict is modified in place and also returned.

    :param finals: Dict of URL:content-length pairs.
    :type finals: dict(str: str)

    :param dupelist: Groups of duplicate URLs.
    :type dupelist: list(set(str))
    """
    for group in dupelist:
        for url in group:
            if "DevAlpha" not in url:
                continue
            del finals[url]
    return finals
1007
1008
1009 5
def dev_dupe_cleaner(finals):
    """
    Clean duplicate autoloader entries.

    URLs are grouped by content-length with ``dev_dupe_dicter``; groups
    holding more than one URL are handed to ``dev_dupe_remover`` for
    filtering.

    :param finals: Dict of URL:content-length pairs.
    :type finals: dict(str: str)
    """
    by_size = dev_dupe_dicter(finals)
    shared = [urls for urls in by_size.values() if len(urls) > 1]
    return dev_dupe_remover(finals, shared)
1020