Completed
Push — master ( 48a75b...b4958a )
by John
04:02
created

sr_lookup_xmlparser()   A

Complexity

Conditions 3

Size

Total Lines 15

Duplication

Lines 0
Ratio 0 %

Code Coverage

Tests 7
CRAP Score 3

Importance

Changes 0
Metric Value
cc 3
c 0
b 0
f 0
dl 0
loc 15
rs 9.4285
ccs 7
cts 7
cp 1
crap 3
1
#!/usr/bin/env python3
2 5
"""This module is used for network connections; APIs, downloading, etc."""
3
4 5
import os  # filesystem read
5 5
try:
6 5
    from defusedxml import ElementTree  # safer XML parsing
7
except (ImportError, AttributeError):
8
    from xml.etree import ElementTree  # XML parsing
9 5
import re  # regexes
10 5
import concurrent.futures  # multiprocessing/threading
11 5
import glob  # pem file lookup
12 5
import requests  # downloading
13 5
from bs4 import BeautifulSoup  # scraping
14 5
from bbarchivist import utilities  # parse filesize
15 5
from bbarchivist.bbconstants import SERVERS  # lookup servers
16
17 5
__author__ = "Thurask"
18 5
__license__ = "WTFPL v2"
19 5
__copyright__ = "2015-2017 Thurask"
20
21
22 5
def grab_pem():
    """
    Pick the CA bundle to use.

    A "cacert.pem" sitting in the current working directory wins;
    otherwise the bundle reported by Requests is used.
    """
    candidates = glob.glob(os.path.join(os.getcwd(), "cacert.pem"))
    if candidates:
        return os.path.abspath(candidates[0])  # local cacerts
    return requests.certs.where()  # no local cacerts
32
33
34 5
def pem_wrapper(method):
    """
    Decorator to set REQUESTS_CA_BUNDLE.

    The returned wrapper keeps the decorated function's name and
    docstring, so introspection and generated docs stay accurate.

    :param method: Method to use.
    :type method: function
    """
    import functools  # local import: keeps this block self-contained

    @functools.wraps(method)
    def wrapper(*args, **kwargs):
        """
        Set REQUESTS_CA_BUNDLE before doing function.
        """
        # Resolved on every call, so a cacert.pem dropped into the working
        # directory later is still picked up.
        os.environ["REQUESTS_CA_BUNDLE"] = grab_pem()
        return method(*args, **kwargs)
    return wrapper
48
49
50 5
def generic_session(session=None):
    """
    Hand back the given Requests session, or make a new one.

    :param session: Requests session object, created if this is None.
    :type session: requests.Session()
    """
    if session is not None:
        return session
    return requests.Session()
59
60
61 5
def generic_soup_parser(url, session=None):
    """
    Fetch a URL and wrap its body in a BeautifulSoup HTML parser.

    :param url: The URL to check.
    :type url: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    response = generic_session(session).get(url)
    return BeautifulSoup(response.content, "html.parser")
75
76
77 5
@pem_wrapper
def get_length(url, session=None):
    """
    Get content-length header from some URL.

    Returns 0 when the URL is None, the connection fails, or the server
    does not send a usable content-length header.

    :param url: The URL to check.
    :type url: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    if url is None:
        return 0
    session = generic_session(session)
    try:
        heads = session.head(url)
    except requests.ConnectionError:
        return 0
    try:
        return int(heads.headers['content-length'])
    except (KeyError, ValueError):
        # Header absent or not an integer: treat as unknown length.
        return 0
97
98
99 5
@pem_wrapper
def download(url, output_directory=None, session=None):
    """
    Fetch one file from a URL into a folder.

    The file keeps the last path segment of the URL as its name, and is
    deleted again if it ended up empty.

    :param url: URL to download from.
    :type url: str

    :param output_directory: Download folder. Default is local.
    :type output_directory: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    session = generic_session(session)
    if output_directory is None:
        output_directory = os.getcwd()
    long_name = url.rsplit('/', 1)[-1]
    short_name = utilities.stripper(long_name)
    target = os.path.join(output_directory, long_name)
    download_writer(url, target, long_name, short_name, session)
    remove_empty_download(target)
120
121
122 5
def remove_empty_download(fname):
    """
    Delete the file at the given path when it is zero bytes long.

    :param fname: File path.
    :type fname: str
    """
    if os.path.getsize(fname) == 0:
        os.remove(fname)
131
132
133 5
def download_writer(url, fname, lfname, sname, session=None):
    """
    Download file and write to disk.

    The output file is always created, even when the request fails, so
    an unsuccessful download leaves an empty file behind.

    :param url: URL to download from.
    :type url: str

    :param fname: File path.
    :type fname: str

    :param lfname: Long filename.
    :type lfname: str

    :param sname: Short name, for printing to screen.
    :type sname: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    # Honour the documented default instead of crashing on None.get().
    session = generic_session(session)
    with open(fname, "wb") as file:
        req = session.get(url, stream=True)
        if req.status_code == 200:  # 200 OK
            # Not every server sends a content-length (e.g. chunked replies).
            clength = req.headers.get('content-length')
            fsize = utilities.fsizer(clength) if clength is not None else "unknown size"
            print("DOWNLOADING {0} [{1}]".format(sname, fsize))
            for chunk in req.iter_content(chunk_size=1024):
                file.write(chunk)
        else:
            print("ERROR: HTTP {0} IN {1}".format(req.status_code, lfname))
162
163
164 5
def download_bootstrap(urls, outdir=None, workers=5, session=None):
    """
    Run downloaders for each file in given URL iterable.

    :param urls: URLs to download.
    :type urls: list

    :param outdir: Download folder. Default is handled in :func:`download`.
    :type outdir: str

    :param workers: Maximum number of worker threads. Default is 5.
    :type workers: int

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    # Never more threads than URLs, but at least one: ThreadPoolExecutor
    # rejects max_workers <= 0, which an empty URL list used to trigger.
    workers = max(1, min(len(urls), workers))
    spinman = utilities.SpinManager()
    with concurrent.futures.ThreadPoolExecutor(max_workers=workers) as xec:
        try:
            spinman.start()
            for url in urls:
                xec.submit(download, url, outdir, session)
        except (KeyboardInterrupt, SystemExit):
            xec.shutdown()
            spinman.stop()
    spinman.stop()
    utilities.spinner_clear()
    utilities.line_begin()
193
194
195 5
@pem_wrapper
def availability(url, session=None):
    """
    Report whether a HEAD request to the URL gives an acceptable status.

    Acceptable means 200 or anything from 301 through 308. A connection
    error counts as unavailable.

    :param url: URL to check.
    :type url: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    session = generic_session(session)
    try:
        response = session.head(url)
    except requests.ConnectionError:
        return False
    code = int(response.status_code)
    return code == 200 or 300 < code <= 308
214
215
216 5
def clean_availability(results, server):
    """
    Turn one server's lookup result into a (release, marker) pair.

    The marker is two spaces when the release is missing or reads
    "SR not in system"; otherwise it is "PD" for server "p" and the
    upper-cased server name for everything else.

    :param results: Result dict.
    :type results: dict(str: str)

    :param server: Server, key for result dict.
    :type server: str
    """
    label = server.upper()
    if server == "p":
        label = "PD"
    release = results[server.lower()]
    if release == "SR not in system" or release is None:
        return release, "  "
    return release, label
230
231
232 5
@pem_wrapper
def carrier_checker(mcc, mnc, session=None):
    """
    Query BlackBerry World to map a MCC and a MNC to a country and carrier.

    Returns a (country, carrier) tuple. Either entry is None when the
    response carries no matching element.

    :param mcc: Country code.
    :type mcc: int

    :param mnc: Network code.
    :type mnc: int

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    session = generic_session(session)
    url = "http://appworld.blackberry.com/ClientAPI/checkcarrier?homemcc={0}&homemnc={1}&devicevendorid=-1&pin=0".format(
        mcc, mnc)
    user_agent = {'User-agent': 'AppWorld/5.1.0.60'}
    req = session.get(url, headers=user_agent)
    root = ElementTree.fromstring(req.text)
    # Pre-seed both names so a response lacking either tag cannot raise
    # UnboundLocalError at the return.
    country = carrier = None
    for child in root:
        if child.tag == "country":
            country = child.get("name")
        elif child.tag == "carrier":
            carrier = child.get("name")
    return country, carrier
258
259
260 5
def return_npc(mcc, mnc):
    """
    Build an NPC string from an MCC and an MNC.

    Each code is left-padded with zeros to three characters and the
    literal "30" is appended.

    :param mcc: Country code.
    :type mcc: int

    :param mnc: Network code.
    :type mnc: int
    """
    country = str(mcc).zfill(3)
    network = str(mnc).zfill(3)
    return "{0}{1}30".format(country, network)
271
272
273 5
@pem_wrapper
def carrier_query(npc, device, upgrade=False, blitz=False, forced=None, session=None):
    """
    Ask BlackBerry's update server which release a carrier is serving.

    Posts an updateDetailRequest XML document and returns whatever
    :func:`parse_carrier_xml` extracts from the reply.

    :param npc: MCC + MNC (see `func:return_npc`)
    :type npc: int

    :param device: Hexadecimal hardware ID.
    :type device: str

    :param upgrade: Whether to use upgrade files. False by default.
    :type upgrade: bool

    :param blitz: Whether or not to create a blitz package. False by default.
    :type blitz: bool

    :param forced: Force a software release.
    :type forced: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    session = generic_session(session)
    upg = "upgrade" if upgrade else "repair"
    if forced is None:
        forced = "latest"
    url = "https://cs.sl.blackberry.com/cse/updateDetails/2.2/"
    # The payload is assembled from fragments and joined once.
    fragments = [
        '<?xml version="1.0" encoding="UTF-8"?>',
        '<updateDetailRequest version="2.2.1" authEchoTS="1366644680359">',
        "<clientProperties>",
        "<hardware>",
        "<pin>0x2FFFFFB3</pin><bsn>1128121361</bsn>",
        "<imei>004401139269240</imei>",
        "<id>0x{0}</id>".format(device),
        "</hardware>",
        "<network>",
        "<homeNPC>0x{0}</homeNPC>".format(npc),
        "<iccid>89014104255505565333</iccid>",
        "</network>",
        "<software>",
        "<currentLocale>en_US</currentLocale>",
        "<legalLocale>en_US</legalLocale>",
        "</software>",
        "</clientProperties>",
        "<updateDirectives>",
        '<allowPatching type="REDBEND">true</allowPatching>',
        "<upgradeMode>{0}</upgradeMode>".format(upg),
        "<provideDescriptions>false</provideDescriptions>",
        "<provideFiles>true</provideFiles>",
        "<queryType>NOTIFICATION_CHECK</queryType>",
        "</updateDirectives>",
        "<pollType>manual</pollType>",
        "<resultPackageSetCriteria>",
        '<softwareRelease softwareReleaseVersion="{0}" />'.format(forced),
        "<releaseIndependent>",
        '<packageType operation="include">application</packageType>',
        "</releaseIndependent>",
        "</resultPackageSetCriteria>",
        "</updateDetailRequest>",
    ]
    query = "".join(fragments)
    header = {"Content-Type": "text/xml;charset=UTF-8"}
    req = session.post(url, headers=header, data=query)
    return parse_carrier_xml(req.text, blitz)
335
336
337 5
def carrier_swver_get(root):
    """
    Get software release from carrier XML.

    When several softwareReleaseMetadata elements exist, the last one
    wins. Returns "N/A" when there is none.

    :param root: ElementTree we're barking up.
    :type root: xml.etree.ElementTree.ElementTree
    """
    # Seeded so an XML tree without any matching element no longer raises
    # UnboundLocalError.
    swver = "N/A"
    for child in root.iter("softwareReleaseMetadata"):
        swver = child.get("softwareReleaseVersion")
    return swver
347
348
349 5
def carrier_child_fileappend(child, files, baseurl, blitz=False):
    """
    Add one element's bar file link to the list, where applicable.

    In blitz mode the radio, desktop and OS system packages are left
    out; otherwise every element's path is appended.

    :param child: Child element in use.
    :type child: xml.etree.ElementTree.Element

    :param files: Filelist.
    :type files: list(str)

    :param baseurl: Base URL, URL minus the filename.
    :type baseurl: str

    :param blitz: Whether or not to create a blitz package. False by default.
    :type blitz: bool
    """
    if blitz and child.get("type") in ["system:radio", "system:desktop", "system:os"]:
        return files  # system packages are excluded from blitz lists
    files.append(baseurl + child.get("path"))
    return files
371
372
373 5
def carrier_child_finder(root, files, baseurl, blitz=False):
    """
    Walk every package element, collecting links and version numbers.

    Returns (osver, radver, files). The OS version comes from the
    "system:desktop" or "system:os" package and the radio version from
    "system:radio"; both stay empty strings when not found.

    :param root: ElementTree we're barking up.
    :type root: xml.etree.ElementTree.ElementTree

    :param files: Filelist.
    :type files: list(str)

    :param baseurl: Base URL, URL minus the filename.
    :type baseurl: str

    :param blitz: Whether or not to create a blitz package. False by default.
    :type blitz: bool
    """
    osver = ""
    radver = ""
    for package in root.iter("package"):
        files = carrier_child_fileappend(package, files, baseurl, blitz)
        kind = package.get("type")
        if kind == "system:radio":
            radver = package.get("version")
        elif kind in ("system:desktop", "system:os"):
            osver = package.get("version")
    return osver, radver, files
399
400
401 5
def parse_carrier_xml(data, blitz=False):
    """
    Pull release, OS, radio and file list out of a carrier update reply.

    Returns (swver, osver, radver, files). The software release is "N/A"
    when the reply has no release metadata; the rest stay empty when the
    reply has no file set.

    :param data: The data to parse.
    :type data: xml

    :param blitz: Whether or not to create a blitz package. False by default.
    :type blitz: bool
    """
    root = ElementTree.fromstring(data)
    if root.find('./data/content/softwareReleaseMetadata') is None:
        swver = "N/A"
    else:
        swver = carrier_swver_get(root)
    osver, radver, files = "", "", []
    fileset = root.find('./data/content/fileSets/fileSet')
    if fileset is not None:
        baseurl = "{0}/".format(fileset.get("url"))
        osver, radver, files = carrier_child_finder(root, files, baseurl, blitz)
    return swver, osver, radver, files
423
424
425 5
@pem_wrapper
def sr_lookup(osver, server, session=None):
    """
    Look up the software release for an OS version on one server.

    Builds the srVersionLookupRequest payload, posts it, and parses
    the reply.

    :param osver: OS version to lookup, 10.x.y.zzzz.
    :type osver: str

    :param server: Server to use.
    :type server: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    fragments = (
        '<?xml version="1.0" encoding="UTF-8"?>',
        '<srVersionLookupRequest version="2.0.0"',
        ' authEchoTS="1366644680359">',
        '<clientProperties><hardware>',
        '<pin>0x2FFFFFB3</pin><bsn>1140011878</bsn>',
        '<imei>004402242176786</imei><id>0x8D00240A</id>',
        '<isBootROMSecure>true</isBootROMSecure>',
        '</hardware>',
        '<network>',
        '<vendorId>0x0</vendorId><homeNPC>0x60</homeNPC>',
        '<currentNPC>0x60</currentNPC><ecid>0x1</ecid>',
        '</network>',
        '<software><currentLocale>en_US</currentLocale>',
        '<legalLocale>en_US</legalLocale>',
        '<osVersion>{0}</osVersion>'.format(osver),
        '<omadmEnabled>false</omadmEnabled>',
        '</software></clientProperties>',
        '</srVersionLookupRequest>',
    )
    query = "".join(fragments)
    return sr_lookup_xmlparser(sr_lookup_poster(query, server, session))
461
462
463 5
def sr_lookup_poster(query, server, session=None):
    """
    Post the XML payload for a software release lookup.

    Returns the response text, or "SR not in system" when the request
    times out or the connection fails. Any other exception propagates
    unchanged.

    :param query: XML payload.
    :type query: str

    :param server: Server to use.
    :type server: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    session = generic_session(session)
    header = {"Content-Type": "text/xml;charset=UTF-8"}
    try:
        req = session.post(server, headers=header, data=query, timeout=1)
    except (requests.exceptions.Timeout, requests.exceptions.ConnectionError):
        return "SR not in system"
    # No return inside a finally block: that used to replace unexpected
    # errors with an UnboundLocalError.
    return req.text
0 ignored issues
show
Bug Best Practice introduced by
return statements in finally blocks should be avoided.

Placing a return statement inside finally will swallow all exceptions that may have been thrown in the try block.

Loading history...
486
487
488 5
def sr_lookup_xmlparser(reqtext):
    """
    Take the text of a software lookup request response and parse it as XML.

    Returns "SR not in system" when the text is not well-formed XML;
    otherwise returns whatever :func:`sr_lookup_extractor` finds. Any
    exception other than a parse error propagates unchanged.

    :param reqtext: Response text, hopefully XML formatted.
    :type reqtext: str
    """
    try:
        root = ElementTree.fromstring(reqtext)
    except ElementTree.ParseError:
        return "SR not in system"
    # No return inside a finally block: that used to hide errors raised
    # while extracting the release.
    return sr_lookup_extractor(root)
0 ignored issues
show
Bug Best Practice introduced by
return statements in finally blocks should be avoided.

Placing a return statement inside finally will swallow all exceptions that may have been thrown in the try block.

Loading history...
503
504
505 5
def sr_lookup_extractor(root):
    """
    Read the software release out of a parsed lookup response.

    Only the first child of data/content that has text is considered.
    Its text is returned when it starts with a four-part dotted version,
    otherwise "SR not in system". Returns None when no child has text.

    :param root: ElementTree we're barking up.
    :type root: xml.etree.ElementTree.ElementTree
    """
    version_pattern = re.compile(r"(\d{1,4}\.)(\d{1,4}\.)(\d{1,4}\.)(\d{1,4})")
    for node in root.findall('./data/content/'):
        text = node.text
        if text is None:
            continue
        if version_pattern.match(text):
            return text
        return "SR not in system"
    return None
519
520
521 5
def sr_lookup_bootstrap(osv, session=None, no2=False):
    """
    Run lookups for each server for given OS.

    Returns a dict mapping server key ("p", "a1", "a2", "b1", "b2") to
    that server's lookup result, or None if interrupted from the keyboard.

    :param osv: OS to check.
    :type osv: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()

    :param no2: Whether to skip Alpha2/Beta2 servers. Default is false.
    :type no2: bool
    """
    keys = ["p", "a1", "a2", "b1", "b2"]
    if no2:
        keys = [key for key in keys if key not in ("a2", "b2")]
    with concurrent.futures.ThreadPoolExecutor(max_workers=5) as xec:
        try:
            # Submit everything first, then collect. Calling .result()
            # straight after each submit made the lookups run one by one.
            futures = [(key, xec.submit(sr_lookup, osv, SERVERS[key], session)) for key in keys]
            return {key: future.result() for key, future in futures}
        except KeyboardInterrupt:
            xec.shutdown(wait=False)
            return None
551
552
553 5
@pem_wrapper
def available_bundle_lookup(mcc, mnc, device, session=None):
    """
    Check which software releases were ever released for a carrier.

    Returns a list of bundle version strings. The list is empty when the
    response has no data/content element.

    :param mcc: Country code.
    :type mcc: int

    :param mnc: Network code.
    :type mnc: int

    :param device: Hexadecimal hardware ID.
    :type device: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    session = generic_session(session)
    server = "https://cs.sl.blackberry.com/cse/availableBundles/1.0.0/"
    npc = return_npc(mcc, mnc)
    query = '<?xml version="1.0" encoding="UTF-8"?>'
    query += '<availableBundlesRequest version="1.0.0" '
    query += 'authEchoTS="1366644680359">'
    query += '<deviceId><pin>0x2FFFFFB3</pin></deviceId>'
    query += '<clientProperties><hardware><id>0x{0}</id>'.format(device)
    query += '<isBootROMSecure>true</isBootROMSecure></hardware>'
    query += '<network><vendorId>0x0</vendorId><homeNPC>0x{0}</homeNPC>'.format(npc)
    query += '<currentNPC>0x{0}</currentNPC></network><software>'.format(npc)
    query += '<currentLocale>en_US</currentLocale>'
    query += '<legalLocale>en_US</legalLocale>'
    query += '<osVersion>10.0.0.0</osVersion>'
    query += '<radioVersion>10.0.0.0</radioVersion></software>'
    query += '</clientProperties><updateDirectives><bundleVersionFilter>'
    query += '</bundleVersionFilter></updateDirectives>'
    query += '</availableBundlesRequest>'
    header = {"Content-Type": "text/xml;charset=UTF-8"}
    req = session.post(server, headers=header, data=query)
    root = ElementTree.fromstring(req.text)
    package = root.find('./data/content')
    if package is None:
        # find() returns None for an error or empty reply; iterating that
        # would raise TypeError.
        return []
    # Children without a version attribute are skipped rather than
    # raising KeyError.
    bundlelist = [child.attrib["version"] for child in package if "version" in child.attrib]
    return bundlelist
594
595
596 5
@pem_wrapper
def ptcrb_scraper(ptcrbid, session=None):
    """
    Scrape the PTCRB certification page for a device and tidy the entries.

    Note that a Referer header is set on the session that is used.

    :param ptcrbid: Numerical ID from PTCRB (end of URL).
    :type ptcrbid: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    baseurl = "https://ptcrb.com/vendor/complete/view_complete_request_guest.cfm?modelid={0}".format(
        ptcrbid)
    sess = generic_session(session)
    sess.headers.update({"Referer": "https://ptcrb.com/vendor/complete/complete_request.cfm"})
    page_text = generic_soup_parser(baseurl, sess).get_text().replace("\r\n", " ")
    entries = re.findall("OS .+[^\\n]", page_text, re.IGNORECASE)
    if not entries:  # Priv
        entries = re.findall(r"[A-Z]{3}[0-9]{3}[\s]", page_text)
    # they should hire QC people...
    return [ptcrb_item_cleaner(entry) for entry in entries if not entry.endswith("\r\n")]
622
623
624 5
def space_pad(instring, minlength):
    """
    Right-pad a string with spaces up to a minimum length.

    Strings already at or over that length come back unchanged.

    :param instring: String to pad.
    :type instring: str

    :param minlength: Pad while len(instring) < minlength.
    :type minlength: int
    """
    return instring.ljust(minlength)
637
638
639 5
def ptcrb_item_cleaner(item):
    """
    Cleanup poorly formatted PTCRB entries written by an intern.

    Normalises an entry into "OS: <ver> Radio: <ver> SW Release: <ver>"
    form, padding the OS and radio versions to 11 characters. A bare
    single token is prefixed with "OS:". Entries with fewer than four
    tokens are padded where possible instead of raising IndexError.

    :param item: The item to clean.
    :type item: str
    """
    # The replacement order matters: later steps rely on earlier ones.
    for old, new in (("<td>", ""), ("</td>", ""), ("\n", ""), (" (SR", ", SR")):
        item = item.replace(old, new)
    item = re.sub(r"\s?\((.*)$", "", item)  # drop parenthesised trailers
    item = re.sub(r"\sSV.*$", "", item)  # drop everything from " SV" on
    for old, new in (
            (")", ""),
            (". ", "."),
            (";", ""),
            ("version", "Version"),
            ("Verison", "Version")):
        item = item.replace(old, new)
    if item.count("OS") > 1:
        # Keep only the text between the first and second "OS".
        templist = item.split("OS")
        item = "".join(["OS", templist[1]])
    for old, new in (
            ("SR", "SW Release"),
            (" Version:", ":"),
            ("Version ", " "),
            (":1", ": 1"),
            (", ", " "),
            ("Software", "SW"),
            ("  ", " "),
            ("OS ", "OS: "),
            ("Radio ", "Radio: "),
            ("Release ", "Release: ")):
        item = item.replace(old, new)
    spaclist = item.split(" ")
    if len(spaclist) > 1:
        # Tokens 1 and 3 are the OS and radio versions in a full entry;
        # short entries may lack the radio part, so check before padding.
        for idx in (1, 3):
            if idx < len(spaclist):
                spaclist[idx] = spaclist[idx].ljust(11)
    else:
        spaclist.insert(0, "OS:")
    return " ".join(spaclist).strip()
680
681
682 5
@pem_wrapper
def kernel_scraper(utils=False, session=None):
    """
    List kernel branch names found on BlackBerry's GitHub branch pages.

    Pages 1 through 9 are read in order, stopping early at the first
    page that shows a "no results" message.

    :param utils: Check android-utils repo instead of android-linux-kernel. Default is False.
    :type utils: bool

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    repo = "android-linux-kernel"
    if utils:
        repo = "android-utils"
    kernlist = []
    sess = generic_session(session)
    for page in range(1, 10):
        url = "https://github.com/blackberry/{0}/branches/all?page={1}".format(repo, page)
        soup = generic_soup_parser(url, sess)
        if soup.find("div", {"class": "no-results-message"}):
            break
        branches = re.findall(r"msm[0-9]{4}\/[A-Z0-9]{6}", soup.get_text(), re.IGNORECASE)
        kernlist.extend(branches)
    return kernlist
705
706
707 5
def root_generator(folder, build, variant="common"):
    """
    Map each device name to the root folder of its hash files.

    :param folder: Dictionary of variant: loader name pairs.
    :type folder: dict(str: str)

    :param build: Build to check, 3 letters + 3 numbers.
    :type build: str

    :param variant: Autoloader variant. Default is "common".
    :type variant: str
    """
    # Priv: folder depends on the carrier variant
    priv_root = "bbfoundation/hashfiles_priv/{0}".format(folder[variant])
    # DTEK50: builds starting with "AAF" live somewhere else
    if build[:3] == "AAF":
        dtek50_root = "bbSupport/DTEK50"
    else:
        dtek50_root = "bbfoundation/hashfiles_priv/dtek50"
    # DTEK60 still uses the DTEK50 folder, for some reason
    return {"Priv": priv_root, "DTEK50": dtek50_root, "DTEK60": dtek50_root}
729
730
731 5
def make_droid_skeleton(method, build, device, variant="common"):
    """
    Build the URL of one Android autoloader, or of its hash file.

    :param method: None for regular OS links, "sha256/512" for SHA256 or 512 hash.
    :type method: str

    :param build: Build to check, 3 letters + 3 numbers.
    :type build: str

    :param device: Device to check.
    :type device: str

    :param variant: Autoloader variant. Default is "common".
    :type variant: str
    """
    folder = {"vzw-vzw": "verizon", "na-att": "att", "na-tmo": "tmo", "common": "default"}
    devices = {"Priv": "qc8992", "DTEK50": "qc8952_64_sfi", "DTEK60": "qc8996"}
    roots = root_generator(folder, build, variant)
    base = "bbry_{2}_autoloader_user-{0}-{1}".format(variant, build.upper(), devices[device])
    if method is not None:
        # hash file link
        return "http://ca.blackberry.com/content/dam/{1}/{0}.{2}sum".format(base, roots[device], method.lower())
    # autoloader zip link
    return "https://bbapps.download.blackberry.com/Priv/{0}.zip".format(base)
756
757
758 5
def bulk_droid_skeletons(devs, build, method=None):
    """
    Build the autoloader/hash URLs for every device and variant.

    Devices listed as carrier devices get one URL per carrier variant;
    all others get only the "common" variant.

    :param devs: List of devices.
    :type devs: list(str)

    :param build: Build to check, 3 letters + 3 numbers.
    :type build: str

    :param method: None for regular OS links, "sha256/512" for SHA256 or 512 hash.
    :type method: str
    """
    carrier_variants = ("common", "vzw-vzw", "na-tmo", "na-att")  # device variants
    common_variants = ("common", )  # no Americans
    carrier_devices = ("Priv", )  # may this list never expand in the future
    skels = []
    for dev in devs:
        if dev in carrier_devices:
            variants = carrier_variants
        else:
            variants = common_variants
        skels.extend([make_droid_skeleton(method, build, dev, var) for var in variants])
    return skels
781
782
783 5
def prepare_droid_list(device):
    """
    Make sure the device argument is a list.

    A list is returned as-is; anything else is wrapped in a new
    one-item list.

    :param device: Device to check.
    :type device: str
    """
    return device if isinstance(device, list) else [device]
795
796
797 5
def droid_scanner(build, device, method=None, session=None):
    """
    Check for Android autoloaders on BlackBerry's site.

    Returns the list of URLs that are available, in the order they were
    generated, or None when none are available.

    :param build: Build to check, 3 letters + 3 numbers.
    :type build: str

    :param device: Device to check.
    :type device: str

    :param method: None for regular OS links, "sha256/512" for SHA256 or 512 hash.
    :type method: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    devs = prepare_droid_list(device)
    skels = bulk_droid_skeletons(devs, build, method)
    if not skels:
        # Nothing to check; also avoids ThreadPoolExecutor(max_workers=0),
        # which raises ValueError.
        return None
    with concurrent.futures.ThreadPoolExecutor(max_workers=len(skels)) as xec:
        # Submit every check before waiting on any, so they run in parallel.
        pending = [(skel, xec.submit(availability, skel, session)) for skel in skels]
        results = [skel for skel, future in pending if future.result()]
    return results if results else None
822
823
824 5
def chunker(iterable, inc):
    """
    Split a sliceable sequence into consecutive pieces of inc items.

    The last piece is shorter when the length is not a multiple of inc.

    :param iterable: Iterable to chunk.
    :type iterable: list/tuple/string

    :param inc: Increment; how big each chunk is.
    :type inc: int
    """
    pieces = []
    for start in range(0, len(iterable), inc):
        pieces.append(iterable[start:start + inc])
    return pieces
836
837
838 5
def unicode_filter(intext):
    """
    Drop every U+2013 character and trim surrounding whitespace.

    :param intext: Text to filter.
    :type intext: str
    """
    without_dashes = "".join(intext.split("\u2013"))
    return without_dashes.strip()
846
847
848 5
def table_header_filter(ptag):
    """
    Decide whether a p tag counts as a table header.

    It qualifies when it contains a b tag and its text mentions
    "BlackBerry" but not "experts". When there is no b tag, the falsy
    result of the search itself is returned.

    :param ptag: P tag.
    :type ptag: bs4.element.Tag
    """
    bold = ptag.find("b")
    if not bold:
        return bold
    return "BlackBerry" in ptag.text and "experts" not in ptag.text
857
858
859 5
def table_headers(pees):
    """
    Collect the text of every p tag that passes the header filter.

    :param pees: List of p tags.
    :type pees: list(bs4.element.Tag)
    """
    headers = []
    for ptag in pees:
        if table_header_filter(ptag):
            headers.append(ptag.text)
    return headers
868
869
870 5
@pem_wrapper
def loader_page_scraper(session=None):
    """
    Fetch the autoloader page and print each of its tables.

    Table headers are taken from the page's p tags and matched to
    tables by position.

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    url = "http://ca.blackberry.com/support/smartphones/Android-OS-Reload.html"
    soup = generic_soup_parser(url, generic_session(session))
    tables = soup.find_all("table")
    headers = table_headers(soup.find_all("p"))
    position = 0
    for table in tables:
        loader_page_chunker(position, table, headers)
        position += 1
885
886
887 5
def loader_page_chunker(idx, table, headers):
    """
    Print one loader table: its header first, then its cells four at a time.

    :param idx: Index of enumerating tables; selects the matching header.
    :type idx: int

    :param table: HTML table tag.
    :type table: bs4.element.Tag

    :param headers: List of table headers.
    :type headers: list(str)
    """
    title = headers[idx]
    print("~~~{0}~~~".format(title))
    cells = table.find_all("td")
    for row in chunker(cells, 4):
        loader_page_printer(row)
    print(" ")  # spacer line after each table
905
906
907 5
def loader_page_printer(chunk):
    """
    Print the first two cell texts and the third cell's link target.

    :param chunk: List of td tags.
    :type chunk: list(bs4.element.Tag)
    """
    raw_fields = [chunk[0].text, chunk[1].text, chunk[2].find("a")["href"]]
    key, ver, link = [unicode_filter(field) for field in raw_fields]
    print("{0}\n    {1}: {2}".format(key, ver, link))
918
919
920 5
@pem_wrapper
def base_metadata(url, session=None):
    """
    Get BBNDK metadata, base function.

    Downloads the URL and returns, for every non-empty line of the
    response body, the second comma-separated field decoded as UTF-8.

    :param url: URL to check.
    :type url: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    session = generic_session(session)
    response = session.get(url)
    metadata = []
    for line in response.content.split(b"\n"):
        if line:
            metadata.append(line.split(b",")[1].decode("utf-8"))
    return metadata
937
938
939 5
def ndk_metadata(session=None):
    """
    Get BBNDK target metadata.

    Only entries beginning with "10.0", "10.1" or "10.2" are kept.

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    url = "http://downloads.blackberry.com/upr/developers/update/bbndk/metadata"
    wanted = ("10.0", "10.1", "10.2")
    targets = []
    for entry in base_metadata(url, session):
        if entry.startswith(wanted):
            targets.append(entry)
    return targets
949
950
951 5
def sim_metadata(session=None):
    """
    Get BBNDK simulator metadata.

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    url = "http://downloads.blackberry.com/upr/developers/update/bbndk/simulator/simulator_metadata"
    return base_metadata(url, session)
960
961
962 5
def runtime_metadata(session=None):
    """
    Get BBNDK runtime metadata.

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    url = "http://downloads.blackberry.com/upr/developers/update/bbndk/runtime/runtime_metadata"
    return base_metadata(url, session)
971
972
973 5
def series_generator(osversion):
    """
    Build the series/branch name from the first three parts of an OS version.

    :param osversion: OS version, dot-separated.
    :type osversion: str
    """
    leading = osversion.split(".")[:3]
    return "BB{0}_{1}_{2}".format(*leading)
982
983
984 5
@pem_wrapper
def devalpha_urls(osversion, skel, session=None):
    """
    Check individual Dev Alpha autoloader URLs.

    Sends a HEAD request for the candidate URL. Returns a
    (url, content-length) tuple when the status code is 200,
    otherwise an empty tuple.

    :param osversion: OS version.
    :type osversion: str

    :param skel: Individual skeleton format to try.
    :type skel: str

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    session = generic_session(session)
    template = "http://downloads.blackberry.com/upr/developers/downloads/{0}{1}.exe"
    url = template.format(skel, osversion)
    response = session.head(url)
    if response.status_code != 200:
        return ()
    return (url, response.headers["content-length"])
1006
1007
1008 5
def devalpha_urls_serieshandler(osversion, skeletons):
    """
    Process list of candidate Dev Alpha autoloader URLs.

    Every "<SERIES>" placeholder is replaced by the series name derived
    from the OS version. A new list is returned and the list passed in is
    left untouched, so the same skeleton list can be reused for another
    OS version.

    :param osversion: OS version.
    :type osversion: str

    :param skeletons: List of skeleton formats to try.
    :type skeletons: list
    """
    # The series name is only computed for skeletons that actually carry
    # the placeholder, matching the original lazy behaviour.
    return [
        skel.replace("<SERIES>", series_generator(osversion)) if "<SERIES>" in skel else skel
        for skel in skeletons
    ]
1023
1024
1025 5
def devalpha_urls_bulk(osversion, skeletons, xec, session=None):
    """
    Construct list of valid Dev Alpha autoloader URLs.

    Returns a dict mapping each URL that answered successfully to its
    reported content-length.

    :param osversion: OS version.
    :type osversion: str

    :param skeletons: List of skeleton formats to try.
    :type skeletons: list

    :param xec: ThreadPoolExecutor instance.
    :type xec: concurrent.futures.ThreadPoolExecutor

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    skels = devalpha_urls_serieshandler(osversion, skeletons)
    # Queue every check before waiting on any result; calling result()
    # straight after submit() would run the checks one at a time.
    # NOTE(review): a caller-supplied session is now used by several
    # workers at once - confirm that is acceptable for this session.
    pending = [xec.submit(devalpha_urls, osversion, skel, session) for skel in skels]
    finals = {}
    # Collect in submission order so the resulting dict order is unchanged.
    for future in pending:
        final = future.result()
        if final:
            finals[final[0]] = final[1]
    return finals
1048
1049
1050 5
def devalpha_urls_bootstrap(osversion, skeletons, session=None):
    """
    Get list of valid Dev Alpha autoloader URLs.

    Runs devalpha_urls_bulk inside a five-worker thread pool. If the run
    is interrupted from the keyboard the pool is told to shut down without
    waiting and None is returned.

    :param osversion: OS version.
    :type osversion: str

    :param skeletons: List of skeleton formats to try.
    :type skeletons: list

    :param session: Requests session object, default is created on the fly.
    :type session: requests.Session()
    """
    pool = concurrent.futures.ThreadPoolExecutor(max_workers=5)
    with pool:
        try:
            found = devalpha_urls_bulk(osversion, skeletons, pool, session)
        except KeyboardInterrupt:
            pool.shutdown(wait=False)
            found = None
        return found
1068
1069
1070 5
def dev_dupe_dicter(finals):
    """
    Invert the autoloader dict: map each content-length to the set of URLs
    that reported it.

    :param finals: Dict of URL:content-length pairs.
    :type finals: dict(str: str)
    """
    by_size = {}
    for url, size in finals.items():
        if size not in by_size:
            by_size[size] = set()
        by_size[size].add(url)
    return by_size
1081
1082
1083 5
def dev_dupe_remover(finals, dupelist):
    """
    Filter dictionary of autoloader entries.

    Every URL in the duplicate groups that contains "DevAlpha" is deleted
    from finals. The dict is modified in place and also returned.

    :param finals: Dict of URL:content-length pairs.
    :type finals: dict(str: str)

    :param dupelist: Groups of duplicate URLs.
    :type dupelist: list(set(str))
    """
    # Lazy generator: entries are examined and deleted one at a time,
    # in the same order as a nested loop would visit them.
    doomed = (entry for dupe in dupelist for entry in dupe if "DevAlpha" in entry)
    for entry in doomed:
        del finals[entry]
    return finals
1098
1099
1100 5
def dev_dupe_cleaner(finals):
    """
    Clean duplicate autoloader entries.

    URLs are grouped by content-length; groups holding more than one URL
    are passed to dev_dupe_remover for pruning.

    :param finals: Dict of URL:content-length pairs.
    :type finals: dict(str: str)
    """
    groups = dev_dupe_dicter(finals)
    dupelist = [urls for urls in groups.values() if len(urls) > 1]
    return dev_dupe_remover(finals, dupelist)
1111