httpie-cli/tests/test_downloads.py

import os
import tempfile
import time
from unittest import mock
from urllib.request import urlopen

import pytest
from requests.structures import CaseInsensitiveDict

from httpie.downloads import (
    parse_content_range, filename_from_content_disposition, filename_from_url,
    get_unique_filename, ContentRangeError, Downloader,
)
from .utils import http, MockEnvironment


class Response:
    """Minimal stand-in for a response object used by the tests below.

    Only stores the three attributes set in ``__init__``: ``url``,
    ``headers`` and ``status_code``.
    """

    def __init__(self, url, headers=None, status_code=200):
        """Record the response attributes.

        :param url: value stored as ``self.url``.
        :param headers: optional mapping of header names to values; when
            omitted the response carries no headers.
        :param status_code: value stored as ``self.status_code``
            (defaults to 200).
        """
        self.url = url
        # ``None`` stands in for "no headers" so that no mutable object is
        # shared between calls as a default argument value.
        self.headers = CaseInsensitiveDict(
            {} if headers is None else headers
        )
        self.status_code = status_code


class TestDownloadUtils:
    """Checks for the helper functions imported from ``httpie.downloads``."""

    def test_Content_Range_parsing(self):
        """Accepted ``Content-Range`` values parse; rejected ones raise."""
        # Well-formed headers, with and without an explicit instance-length.
        assert parse_content_range('bytes 100-199/200', 100) == 200
        assert parse_content_range('bytes 100-199/*', 100) == 200

        # A range that consists of a single byte.
        assert parse_content_range('bytes 100-100/*', 100) == 101

        # Every (header, second argument) pair below must be rejected.
        rejected = [
            (None, 100),                 # missing
            ('beers 100-199/*', 100),    # syntax error
            ('bytes 100-199/*', 99),     # unexpected range
            ('bytes 100-199/199', 100),  # invalid instance-length
            ('bytes 100-99/199', 100),   # invalid byte-range-resp-spec
        ]
        for header, start in rejected:
            with pytest.raises(ContentRangeError):
                parse_content_range(header, start)

    @pytest.mark.parametrize('header, expected_filename', [
        ('attachment; filename=hello-WORLD_123.txt', 'hello-WORLD_123.txt'),
        ('attachment; filename=".hello-WORLD_123.txt"', 'hello-WORLD_123.txt'),
        ('attachment; filename="white space.txt"', 'white space.txt'),
        (r'attachment; filename="\"quotes\".txt"', '"quotes".txt'),
        ('attachment; filename=/etc/hosts', 'hosts'),
        ('attachment; filename=', None)
    ])
    def test_Content_Disposition_parsing(self, header, expected_filename):
        """Each ``Content-Disposition`` header yields the expected name."""
        parsed = filename_from_content_disposition(header)
        assert parsed == expected_filename

    def test_filename_from_url(self):
        """The filename derived from a URL depends on the content type."""
        # (content type passed in, filename expected back) for the same URL.
        cases = [
            ('text/plain', 'foo.txt'),
            ('text/html; charset=utf8', 'foo.html'),
            (None, 'foo'),
            ('x-foo/bar', 'foo'),
        ]
        for content_type, wanted in cases:
            assert wanted == filename_from_url(
                url='http://example.org/foo',
                content_type=content_type
            )

    @pytest.mark.parametrize(
        'orig_name, unique_on_attempt, expected',
        [
            # Simple
            ('foo.bar', 0, 'foo.bar'),
            ('foo.bar', 1, 'foo.bar-1'),
            ('foo.bar', 10, 'foo.bar-10'),
            # Trim
            ('A' * 20, 0, 'A' * 10),
            ('A' * 20, 1, 'A' * 8 + '-1'),
            ('A' * 20, 10, 'A' * 7 + '-10'),
            # Trim before ext
            ('A' * 20 + '.txt', 0, 'A' * 6 + '.txt'),
            ('A' * 20 + '.txt', 1, 'A' * 4 + '.txt-1'),
            # Trim at the end
            ('foo.' + 'A' * 20, 0, 'foo.' + 'A' * 6),
            ('foo.' + 'A' * 20, 1, 'foo.' + 'A' * 4 + '-1'),
            ('foo.' + 'A' * 20, 10, 'foo.' + 'A' * 3 + '-10'),
        ]
    )
    @mock.patch('httpie.downloads.get_filename_max_length')
    def test_unique_filename(self, get_filename_max_length,
                             orig_name, unique_on_attempt,
                             expected):
        """``get_unique_filename`` output with the max length mocked to 10."""
        get_filename_max_length.return_value = 10

        taken_so_far = 0

        # noinspection PyUnusedLocal
        def exists(filename):
            # Report "already exists" for the first ``unique_on_attempt``
            # calls, and "free" for every call after that.
            nonlocal taken_so_far
            if taken_so_far == unique_on_attempt:
                return False
            taken_so_far += 1
            return True

        assert expected == get_unique_filename(orig_name, exists)


class TestDownloads:
    """Download tests: one CLI run with ``--download`` plus direct
    ``Downloader`` usage with hand-built ``Response`` objects.
    """
    # TODO: more tests

    def test_actual_download(self, httpbin_both, httpbin):
        """``--download`` reports progress on stderr and yields the body."""
        robots_txt = '/robots.txt'
        # Fetch the reference body directly. The ``with`` block closes the
        # response so the connection is not left open after the read.
        with urlopen(httpbin + robots_txt) as response:
            body = response.read().decode()
        env = MockEnvironment(stdin_isatty=True, stdout_isatty=False)
        r = http('--download', httpbin_both.url + robots_txt, env=env)
        assert 'Downloading' in r.stderr
        # NOTE(review): presumably part of a terminal line-clearing escape
        # sequence written by the progress output; confirm.
        assert '[K' in r.stderr
        assert 'Done' in r.stderr
        assert body == r

    def test_download_with_Content_Length(self, httpbin_both):
        """Two 5-byte chunks against ``Content-Length: 10`` finish cleanly."""
        with open(os.devnull, 'w') as devnull:
            downloader = Downloader(output_file=devnull, progress_file=devnull)
            downloader.start(
                initial_url='/',
                final_response=Response(
                    url=httpbin_both.url + '/',
                    headers={'Content-Length': 10}
                )
            )
            # NOTE(review): the pauses presumably give the progress reporter
            # time to run between chunks; confirm against Downloader.
            time.sleep(1.1)
            downloader.chunk_downloaded(b'12345')
            time.sleep(1.1)
            downloader.chunk_downloaded(b'12345')
            downloader.finish()
            assert not downloader.interrupted
            downloader._progress_reporter.join()

    def test_download_no_Content_Length(self, httpbin_both):
        """A response with no ``Content-Length`` is not seen as interrupted."""
        with open(os.devnull, 'w') as devnull:
            downloader = Downloader(output_file=devnull, progress_file=devnull)
            downloader.start(
                final_response=Response(url=httpbin_both.url + '/'),
                initial_url='/'
            )
            time.sleep(1.1)
            downloader.chunk_downloaded(b'12345')
            downloader.finish()
            assert not downloader.interrupted
            downloader._progress_reporter.join()

    def test_download_interrupted(self, httpbin_both):
        """Receiving 4 bytes of a declared 5 marks the download interrupted."""
        with open(os.devnull, 'w') as devnull:
            downloader = Downloader(output_file=devnull, progress_file=devnull)
            downloader.start(
                final_response=Response(
                    url=httpbin_both.url + '/',
                    headers={'Content-Length': 5}
                ),
                initial_url='/'
            )
            downloader.chunk_downloaded(b'1234')
            downloader.finish()
            assert downloader.interrupted
            downloader._progress_reporter.join()

    def test_download_with_redirect_original_url_used_for_filename(self, httpbin):
        """After a redirect, the saved file is named after the initial URL."""
        # Redirect from `/redirect/1` to `/get`.
        expected_filename = '1.json'
        orig_cwd = os.getcwd()
        with tempfile.TemporaryDirectory() as tmp_dirname:
            # Run inside an empty scratch directory so the only file present
            # afterwards is the one the download created.
            os.chdir(tmp_dirname)
            try:
                assert os.listdir('.') == []
                http('--download', httpbin.url + '/redirect/1')
                assert os.listdir('.') == [expected_filename]
            finally:
                # Restore the working directory before the scratch directory
                # is removed on leaving the ``with`` block.
                os.chdir(orig_cwd)
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00			`import os`
Changed the way the output filename is generated When ``--download`` without ``--output`` results in a redirect, now only the initial URL is considered, not the final one. 2019-06-24 12:19:29 +02:00			`import tempfile`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00			`import time`
Replace usage of mock with unittest.mock (#1054) Since Python 3, the mock dependency is no more required as it is already part of the unittest module. 2021-04-30 15:08:27 +02:00			`from unittest import mock`
Python 2.7 support removal WIP 2019-08-29 08:53:56 +02:00			`from urllib.request import urlopen`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00
Finished pytest migration. 2014-04-24 17:08:40 +02:00			`import pytest`
Cleanup XX 2014-04-24 15:48:01 +02:00			`from requests.structures import CaseInsensitiveDict`

Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00			`from httpie.downloads import (`
Added CONTRIBUTING.rst. 2014-04-24 18:20:23 +02:00			`parse_content_range, filename_from_content_disposition, filename_from_url,`
Refactoring 2016-02-29 08:00:17 +01:00			`get_unique_filename, ContentRangeError, Downloader,`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00			`)`
Use relative imports (#1057) * Use relative imports in test * Use relative imports * Add myself to contributors :) 2021-05-05 14:13:39 +02:00			`from .utils import http, MockEnvironment`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00

Python 3 annotations, super(), pathlib, etc. 2019-08-30 11:32:14 +02:00			`class Response:`
Cleanup XX 2014-04-24 15:48:01 +02:00			`# noinspection PyDefaultArgument`
			`def __init__(self, url, headers={}, status_code=200):`
			`self.url = url`
			`self.headers = CaseInsensitiveDict(headers)`
			`self.status_code = status_code`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00

Removed last dependencies on unittest. All tests are pytest-only. 2014-04-25 11:39:59 +02:00			`class TestDownloadUtils:`
Changed the way the output filename is generated When ``--download`` without ``--output`` results in a redirect, now only the initial URL is considered, not the final one. 2019-06-24 12:19:29 +02:00
Cleanup XX 2014-04-24 15:48:01 +02:00			`def test_Content_Range_parsing(self):`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00			`parse = parse_content_range`

Converted all unittest asserts to plain, pytest-powered asserts. 2014-04-24 14:58:15 +02:00			`assert parse('bytes 100-199/200', 100) == 200`
			`assert parse('bytes 100-199/*', 100) == 200`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00
Correctly handle single-byte Content-Range (#1032) HTTPie previously failed if it continued a download with a single byte left. 2021-02-14 13:30:58 +01:00			`# single byte`
			`assert parse('bytes 100-100/*', 100) == 101`

Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00			`# missing`
Finished pytest migration. 2014-04-24 17:08:40 +02:00			`pytest.raises(ContentRangeError, parse, None, 100)`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00
			`# syntax error`
Finished pytest migration. 2014-04-24 17:08:40 +02:00			`pytest.raises(ContentRangeError, parse, 'beers 100-199/*', 100)`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00
			`# unexpected range`
Finished pytest migration. 2014-04-24 17:08:40 +02:00			`pytest.raises(ContentRangeError, parse, 'bytes 100-199/*', 99)`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00
			`# invalid instance-length`
Finished pytest migration. 2014-04-24 17:08:40 +02:00			`pytest.raises(ContentRangeError, parse, 'bytes 100-199/199', 100)`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00
			`# invalid byte-range-resp-spec`
Finished pytest migration. 2014-04-24 17:08:40 +02:00			`pytest.raises(ContentRangeError, parse, 'bytes 100-99/199', 100)`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00
Removed last dependencies on unittest. All tests are pytest-only. 2014-04-25 11:39:59 +02:00			`@pytest.mark.parametrize('header, expected_filename', [`
			`('attachment; filename=hello-WORLD_123.txt', 'hello-WORLD_123.txt'),`
			`('attachment; filename=".hello-WORLD_123.txt"', 'hello-WORLD_123.txt'),`
			`('attachment; filename="white space.txt"', 'white space.txt'),`
			`(r'attachment; filename="\"quotes\".txt"', '"quotes".txt'),`
			`('attachment; filename=/etc/hosts', 'hosts'),`
			`('attachment; filename=', None)`
			`])`
			`def test_Content_Disposition_parsing(self, header, expected_filename):`
			`assert filename_from_content_disposition(header) == expected_filename`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00
			`def test_filename_from_url(self):`
Converted all unittest asserts to plain, pytest-powered asserts. 2014-04-24 14:58:15 +02:00			`assert 'foo.txt' == filename_from_url(`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00			`url='http://example.org/foo',`
			`content_type='text/plain'`
Converted all unittest asserts to plain, pytest-powered asserts. 2014-04-24 14:58:15 +02:00			`)`
			`assert 'foo.html' == filename_from_url(`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00			`url='http://example.org/foo',`
			`content_type='text/html; charset=utf8'`
Converted all unittest asserts to plain, pytest-powered asserts. 2014-04-24 14:58:15 +02:00			`)`
			`assert 'foo' == filename_from_url(`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00			`url='http://example.org/foo',`
			`content_type=None`
Converted all unittest asserts to plain, pytest-powered asserts. 2014-04-24 14:58:15 +02:00			`)`
			`assert 'foo' == filename_from_url(`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00			`url='http://example.org/foo',`
			`content_type='x-foo/bar'`
Converted all unittest asserts to plain, pytest-powered asserts. 2014-04-24 14:58:15 +02:00			`)`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00
Fixed #451 - OSError: [Errno 36] File name too long 2016-03-17 08:58:01 +01:00			`@pytest.mark.parametrize(`
			`'orig_name, unique_on_attempt, expected',`
			`[`
			`# Simple`
			`('foo.bar', 0, 'foo.bar'),`
			`('foo.bar', 1, 'foo.bar-1'),`
			`('foo.bar', 10, 'foo.bar-10'),`
			`# Trim`
			`('A' * 20, 0, 'A' * 10),`
			`('A' * 20, 1, 'A' * 8 + '-1'),`
			`('A' * 20, 10, 'A' * 7 + '-10'),`
			`# Trim before ext`
			`('A' * 20 + '.txt', 0, 'A' * 6 + '.txt'),`
			`('A' * 20 + '.txt', 1, 'A' * 4 + '.txt-1'),`
			`# Trim at the end`
			`('foo.' + 'A' * 20, 0, 'foo.' + 'A' * 6),`
			`('foo.' + 'A' * 20, 1, 'foo.' + 'A' * 4 + '-1'),`
			`('foo.' + 'A' * 20, 10, 'foo.' + 'A' * 3 + '-10'),`
			`]`
			`)`
			`@mock.patch('httpie.downloads.get_filename_max_length')`
			`def test_unique_filename(self, get_filename_max_length,`
			`orig_name, unique_on_attempt,`
			`expected):`

Cleanup XX 2014-04-24 15:48:01 +02:00			`def attempts(unique_on_attempt=0):`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00			`# noinspection PyUnresolvedReferences,PyUnusedLocal`
			`def exists(filename):`
			`if exists.attempt == unique_on_attempt:`
			`return False`
			`exists.attempt += 1`
			`return True`
Cleanup XX 2014-04-24 15:48:01 +02:00
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00			`exists.attempt = 0`
			`return exists`

Fixed #451 - OSError: [Errno 36] File name too long 2016-03-17 08:58:01 +01:00			`get_filename_max_length.return_value = 10`

			`actual = get_unique_filename(orig_name, attempts(unique_on_attempt))`
			`assert expected == actual`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00

Removed last dependencies on unittest. All tests are pytest-only. 2014-04-25 11:39:59 +02:00			`class TestDownloads:`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00			`# TODO: more tests`

Run tests against both HTTP and HTTPS Some of the tests now use the `httpbin_both` fixture from pytest-httpbin. Also, made httpbin's CA trusted by default and added `httpbin_secure_untrusted` fixture to allow overriding that for particular tests. 2016-03-06 10:42:35 +01:00			`def test_actual_download(self, httpbin_both, httpbin):`
			`robots_txt = '/robots.txt'`
			`body = urlopen(httpbin + robots_txt).read().decode()`
Rename `TestEnvironment` to `MockEnvironment` to avoid pytest warnings Close #621 2017-12-28 18:17:48 +01:00			`env = MockEnvironment(stdin_isatty=True, stdout_isatty=False)`
Run tests against both HTTP and HTTPS Some of the tests now use the `httpbin_both` fixture from pytest-httpbin. Also, made httpbin's CA trusted by default and added `httpbin_secure_untrusted` fixture to allow overriding that for particular tests. 2016-03-06 10:42:35 +01:00			`r = http('--download', httpbin_both.url + robots_txt, env=env)`
Converted all unittest asserts to plain, pytest-powered asserts. 2014-04-24 14:58:15 +02:00			`assert 'Downloading' in r.stderr`
			`assert '[K' in r.stderr`
			`assert 'Done' in r.stderr`
			`assert body == r`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00
Run tests against both HTTP and HTTPS Some of the tests now use the `httpbin_both` fixture from pytest-httpbin. Also, made httpbin's CA trusted by default and added `httpbin_secure_untrusted` fixture to allow overriding that for particular tests. 2016-03-06 10:42:35 +01:00			`def test_download_with_Content_Length(self, httpbin_both):`
Fix several ResourceWarning: unclosed file (#741) Signed-off-by: Mickaël Schoentgen <contact@tiger-222.fr> 2019-02-04 10:00:30 +01:00			`with open(os.devnull, 'w') as devnull:`
			`downloader = Downloader(output_file=devnull, progress_file=devnull)`
Add one-by-one processing of each HTTP request or response and --offline 2019-09-03 17:14:39 +02:00			`downloader.start(`
			`initial_url='/',`
			`final_response=Response(`
			`url=httpbin_both.url + '/',`
			`headers={'Content-Length': 10}`
			`)`
			`)`
Fix several ResourceWarning: unclosed file (#741) Signed-off-by: Mickaël Schoentgen <contact@tiger-222.fr> 2019-02-04 10:00:30 +01:00			`time.sleep(1.1)`
			`downloader.chunk_downloaded(b'12345')`
			`time.sleep(1.1)`
			`downloader.chunk_downloaded(b'12345')`
			`downloader.finish()`
			`assert not downloader.interrupted`
			`downloader._progress_reporter.join()`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00
Run tests against both HTTP and HTTPS Some of the tests now use the `httpbin_both` fixture from pytest-httpbin. Also, made httpbin's CA trusted by default and added `httpbin_secure_untrusted` fixture to allow overriding that for particular tests. 2016-03-06 10:42:35 +01:00			`def test_download_no_Content_Length(self, httpbin_both):`
Fix several ResourceWarning: unclosed file (#741) Signed-off-by: Mickaël Schoentgen <contact@tiger-222.fr> 2019-02-04 10:00:30 +01:00			`with open(os.devnull, 'w') as devnull:`
			`downloader = Downloader(output_file=devnull, progress_file=devnull)`
Add one-by-one processing of each HTTP request or response and --offline 2019-09-03 17:14:39 +02:00			`downloader.start(`
			`final_response=Response(url=httpbin_both.url + '/'),`
			`initial_url='/'`
			`)`
Fix several ResourceWarning: unclosed file (#741) Signed-off-by: Mickaël Schoentgen <contact@tiger-222.fr> 2019-02-04 10:00:30 +01:00			`time.sleep(1.1)`
			`downloader.chunk_downloaded(b'12345')`
			`downloader.finish()`
			`assert not downloader.interrupted`
			`downloader._progress_reporter.join()`
Refactored tests into smaller modules. 2014-04-24 14:07:31 +02:00
Run tests against both HTTP and HTTPS Some of the tests now use the `httpbin_both` fixture from pytest-httpbin. Also, made httpbin's CA trusted by default and added `httpbin_secure_untrusted` fixture to allow overriding that for particular tests. 2016-03-06 10:42:35 +01:00			`def test_download_interrupted(self, httpbin_both):`
Fix several ResourceWarning: unclosed file (#741) Signed-off-by: Mickaël Schoentgen <contact@tiger-222.fr> 2019-02-04 10:00:30 +01:00			`with open(os.devnull, 'w') as devnull:`
			`downloader = Downloader(output_file=devnull, progress_file=devnull)`
Add one-by-one processing of each HTTP request or response and --offline 2019-09-03 17:14:39 +02:00			`downloader.start(`
			`final_response=Response(`
			`url=httpbin_both.url + '/',`
			`headers={'Content-Length': 5}`
			`),`
			`initial_url='/'`
			`)`
Fix several ResourceWarning: unclosed file (#741) Signed-off-by: Mickaël Schoentgen <contact@tiger-222.fr> 2019-02-04 10:00:30 +01:00			`downloader.chunk_downloaded(b'1234')`
			`downloader.finish()`
			`assert downloader.interrupted`
			`downloader._progress_reporter.join()`
Changed the way the output filename is generated When ``--download`` without ``--output`` results in a redirect, now only the initial URL is considered, not the final one. 2019-06-24 12:19:29 +02:00
			`def test_download_with_redirect_original_url_used_for_filename(self, httpbin):`
			# Redirect from `/redirect/1` to `/get`.
			`expected_filename = '1.json'`
			`orig_cwd = os.getcwd()`
Finish `--quiet` 2020-08-15 15:25:05 +02:00			`with tempfile.TemporaryDirectory() as tmp_dirname:`
			`os.chdir(tmp_dirname)`
			`try:`
			`assert os.listdir('.') == []`
			`http('--download', httpbin.url + '/redirect/1')`
			`assert os.listdir('.') == [expected_filename]`
			`finally:`
			`os.chdir(orig_cwd)`