2015-11-29 09:22:03 +00:00
|
|
|
"""An example of wrapping manual tqdm updates for urllib reporthook.
|
2015-09-14 15:28:07 +00:00
|
|
|
|
|
|
|
# urllib.urlretrieve documentation
|
|
|
|
> If present, the hook function will be called once
|
|
|
|
> on establishment of the network connection and once after each block read
|
|
|
|
> thereafter. The hook will be passed three arguments; a count of blocks
|
|
|
|
> transferred so far, a block size in bytes, and the total size of the file.
|
|
|
|
|
|
|
|
Usage:
|
|
|
|
tqdm_wget.py [options]
|
|
|
|
|
|
|
|
Options:
|
2015-11-29 09:22:03 +00:00
|
|
|
-h, --help
|
|
|
|
Print this help message and exit
|
2015-09-14 15:28:07 +00:00
|
|
|
-u URL, --url URL : string, optional
|
|
|
|
The url to fetch.
|
2017-05-28 22:43:13 +00:00
|
|
|
[default: https://caspersci.uk.to/matryoshka.zip]
|
2015-09-14 15:28:07 +00:00
|
|
|
-o FILE, --output FILE : string, optional
|
|
|
|
The local file path in which to save the url [default: /dev/null].
|
|
|
|
"""
|
|
|
|
|
|
|
|
import urllib
|
2017-05-28 22:43:13 +00:00
|
|
|
from os import devnull
|
2015-09-14 15:28:07 +00:00
|
|
|
from tqdm import tqdm
|
|
|
|
from docopt import docopt
|
|
|
|
|
|
|
|
|
2015-11-29 09:22:03 +00:00
|
|
|
def my_hook(t):
    """Wrap a tqdm instance in a `reporthook`-compatible callback.

    The returned function converts the absolute block count reported by
    `urlretrieve` into the incremental updates that `tqdm.update()` expects.

    Don't forget to close() or __exit__()
    the tqdm instance once you're done with it (easiest using `with` syntax).

    Parameters
    ----------
    t : tqdm
        Progress bar to drive. Only its `total` attribute and `update()`
        method are used.

    Returns
    -------
    update_to : callable
        Function with the signature `update_to(b=1, bsize=1, tsize=None)`.

    Example
    -------

    >>> with tqdm(...) as t:
    ...     reporthook = my_hook(t)
    ...     urllib.urlretrieve(..., reporthook=reporthook)

    """
    # One-element list used as a mutable cell, so the nested function can
    # remember the previous block count without needing `nonlocal`.
    last_b = [0]

    def update_to(b=1, bsize=1, tsize=None):
        """Advance the wrapped bar to `b` blocks of `bsize` units each.

        b  : int, optional
            Number of blocks transferred so far [default: 1].
        bsize  : int, optional
            Size of each block (in tqdm units) [default: 1].
        tsize  : int, optional
            Total size (in tqdm units). If None [default] or -1 (the value
            `urlretrieve` reports when the size is unknown), the bar's
            total remains unchanged.
        """
        # -1 means "size unknown"; writing it to `total` would corrupt the bar.
        if tsize not in (None, -1):
            t.total = tsize
        # `b` is cumulative, tqdm wants a delta since the previous call.
        t.update((b - last_b[0]) * bsize)
        last_b[0] = b

    return update_to
|
|
|
|
|
|
|
|
|
|
|
|
class TqdmUpTo(tqdm):
    """Alternative Class-based version of the above.

    Provides `update_to(n)` which uses `tqdm.update(delta_n)`.

    Inspired by [twine#242](https://github.com/pypa/twine/pull/242),
    [here](https://github.com/pypa/twine/commit/42e55e06).
    """

    def update_to(self, b=1, bsize=1, tsize=None):
        """Advance the bar to the absolute position `b * bsize`.

        The signature matches the `reporthook` callback of `urlretrieve`,
        so the bound method can be passed to it directly.

        b  : int, optional
            Number of blocks transferred so far [default: 1].
        bsize  : int, optional
            Size of each block (in tqdm units) [default: 1].
        tsize  : int, optional
            Total size (in tqdm units). If None [default] or -1 (the value
            `urlretrieve` reports when the size is unknown), the bar's
            total remains unchanged.
        """
        # -1 means "size unknown"; writing it to `total` would corrupt the bar.
        if tsize not in (None, -1):
            self.total = tsize
        self.update(b * bsize - self.n)  # will also set self.n = b * bsize
|
2015-09-14 15:28:07 +00:00
|
|
|
|
|
|
|
|
|
|
|
# `urlretrieve` lives in `urllib` on Python 2 but in `urllib.request` on
# Python 3; resolve it once here so the download below works on both.
try:
    from urllib import urlretrieve
except ImportError:
    from urllib.request import urlretrieve

# Parse the command line against the usage text in the module docstring.
opts = docopt(__doc__)

eg_link = opts['--url']
# Last path component of the URL, used as the progress bar description.
eg_file = eg_link.replace('/', ' ').split()[-1]
# Map the POSIX default onto the platform's null device.
eg_out = opts['--output'].replace("/dev/null", devnull)

# Equivalent closure-based variant, kept for reference:
# with tqdm(unit='B', unit_scale=True, unit_divisor=1024, miniters=1,
#           desc=eg_file) as t:  # all optional kwargs
#     urlretrieve(eg_link, filename=eg_out,
#                 reporthook=my_hook(t), data=None)
with TqdmUpTo(unit='B', unit_scale=True, unit_divisor=1024, miniters=1,
              desc=eg_file) as t:  # all optional kwargs
    urlretrieve(eg_link, filename=eg_out, reporthook=t.update_to,
                data=None)
|