httpie-cli/httpie/output.py

"""Output processing and formatting.

"""
import re
import json

import pygments
from pygments import token, lexer
from pygments.styles import get_style_by_name, STYLE_MAP
from pygments.lexers import get_lexer_for_mimetype
from pygments.formatters.terminal import TerminalFormatter
from pygments.formatters.terminal256 import Terminal256Formatter
from pygments.util import ClassNotFound
from requests.compat import is_windows

from . import solarized
from .models import Environment


# Style name used by `PygmentsProcessor` when no `pygments_style` is given.
DEFAULT_STYLE = 'solarized'
# The default style followed by every style name listed in Pygments'
# `STYLE_MAP`.
AVAILABLE_STYLES = [DEFAULT_STYLE] + list(STYLE_MAP.keys())
# Text that `format()` emits in place of a body that cannot be decoded
# with the message encoding.
BINARY_SUPPRESSED_NOTICE = (
    '+-----------------------------------------+\n'
    '| NOTE: binary data not shown in terminal |\n'
    '+-----------------------------------------+'
)


def format(msg, prettifier=None, with_headers=True, with_body=True,
           env=None):
    """Return an encoded representation of a `models.HTTPMessage`.

    Sometimes the body contains binary data so we always return `bytes`.

    If `prettifier` is set or the output is a terminal then a binary
    body is not included in the output and is replaced with a notice.

    Generally, when the `stdout` is redirected, the output matches the actual
    message as much as possible. When `--pretty` is set (or implied),
    or when the output is a terminal, then we prefer readability over
    precision.

    :param msg: the message to render; its `line`, `headers`, `body`,
        `encoding` and `content_type` attributes are read.
    :param prettifier: optional object providing `process_headers()` and
        `process_body()`; when given, both are applied to the decoded text.
    :param with_headers: include the start line and the headers.
    :param with_body: include the body (only when it is non-empty).
    :param env: object describing `stdout`; a new `Environment()` is
        created when omitted.
    :return: the rendered message as `bytes`. On a terminal it is encoded
        with the terminal's encoding, otherwise with the message's own
        encoding; `'utf8'` is the fallback in both cases.

    """
    if env is None:
        # Build the default lazily: a call in the signature would be
        # evaluated only once, at import time, and then shared by every
        # call of this function.
        env = Environment()

    # The message may not declare an encoding; fall back to UTF-8 both for
    # decoding the body and (when redirected) for encoding the output.
    msg_encoding = msg.encoding or 'utf8'

    # Output encoding.
    if env.stdout_isatty:
        # Use encoding suitable for the terminal. Unsupported characters
        # will be replaced in the output.
        errors = 'replace'
        output_encoding = getattr(env.stdout, 'encoding', None) or 'utf8'
    else:
        # Preserve the message encoding.
        errors = 'strict'
        output_encoding = msg_encoding

    if prettifier:
        env.init_colors()

    include_body = bool(with_body and msg.body)

    #noinspection PyArgumentList
    output = bytearray()

    if with_headers:
        headers = '\n'.join([msg.line, msg.headers])

        if prettifier:
            headers = prettifier.process_headers(headers)

        output.extend(
            headers.encode(output_encoding, errors).strip())

        if include_body:
            # Blank line separating the headers from the body.
            output.extend(b'\n\n')

    if include_body:

        body = msg.body

        # When the output is redirected and not prettified, the body is
        # written verbatim, even if it is binary.
        if env.stdout_isatty or prettifier:
            try:
                text = body.decode(msg_encoding)
            except UnicodeDecodeError:
                # Suppress binary data.
                body = BINARY_SUPPRESSED_NOTICE.encode(output_encoding)
                if not with_headers:
                    output.extend(b'\n')
            else:
                if prettifier and msg.content_type:
                    text = prettifier.process_body(
                        text, msg.content_type).strip()

                body = text.encode(output_encoding, errors)

        output.extend(body)

    return bytes(output)


class HTTPLexer(lexer.RegexLexer):
    """Simplified HTTP lexer for Pygments.

    It only operates on headers and provides a stronger contrast between
    their names and values than the original one bundled with Pygments
    (`pygments.lexers.text import HttpLexer`), especially when
    Solarized color scheme is used.

    The single `root` state holds three rules, tried in the order they
    are listed: request line, response status line, header line.

    """
    name = 'HTTP'
    aliases = ['http']
    filenames = ['*.http']
    tokens = {
        'root': [

            # Request-Line
            # Groups: method, spaces, request target, spaces,
            # 'HTTP', '/', version.
            (r'([A-Z]+)( +)([^ ]+)( +)(HTTP)(/)(\d+\.\d+)',
             lexer.bygroups(
                token.Name.Function,  # Method
                token.Text,
                token.Name.Namespace,  # Request target
                token.Text,
                token.Keyword.Reserved,  # 'HTTP'
                token.Operator,  # '/'
                token.Number  # Version
             )),

            # Response Status-Line
            (r'(HTTP)(/)(\d+\.\d+)( +)(\d{3})( +)(.+)',
             lexer.bygroups(
                 token.Keyword.Reserved,  # 'HTTP'
                 token.Operator,  # '/'
                 token.Number,  # Version
                 token.Text,
                 token.Number,  # Status code
                 token.Text,
                 token.Name.Exception,  # Reason
             )),

            # Header
            # The name group is non-greedy, so it ends at the first colon
            # (minus any spaces before it); the value must be non-empty.
            (r'(.*?)( *)(:)( *)(.+)', lexer.bygroups(
                token.Name.Attribute,  # Name
                token.Text,
                token.Operator,  # Colon
                token.Text,
                token.String  # Value
            ))
    ]}


class BaseProcessor(object):
    """Pass-through processor that concrete processors build upon.

    Both `process_*` methods return their input unchanged; subclasses
    override the ones they care about.

    """

    # Class-level default; an instance may set this to False.
    enabled = True

    def __init__(self, env, **kwargs):
        """Keep the environment and any keyword options on the instance."""
        self.kwargs = kwargs
        self.env = env

    def process_body(self, content, content_type):
        """Return `content` untouched, whatever the `content_type`."""
        return content

    def process_headers(self, headers):
        """Return `headers` untouched."""
        return headers


class JSONProcessor(BaseProcessor):
    """Re-indent JSON bodies and sort their keys."""

    def process_body(self, content, content_type):
        """Return `content` pretty-printed if it is valid JSON.

        Only bodies whose `content_type` is exactly `application/json`
        are touched; anything else, and any body that fails to parse,
        is returned unchanged.

        """
        if content_type != 'application/json':
            return content

        try:
            # Indent and sort the JSON data.
            return json.dumps(
                json.loads(content),
                sort_keys=True,
                ensure_ascii=False,
                indent=4,
            )
        except ValueError:
            # Invalid JSON - we don't care.
            return content


class PygmentsProcessor(BaseProcessor):
    """Colorize headers and bodies with Pygments.

    The processor disables itself when the environment reports no colors.

    """

    def __init__(self, *args, **kwargs):
        """Pick the style and the terminal formatter to highlight with."""
        super(PygmentsProcessor, self).__init__(*args, **kwargs)

        if not self.env.colors:
            # No colors available: leave `formatter` unset and opt out.
            self.enabled = False
            return

        style_name = self.kwargs.get('pygments_style', DEFAULT_STYLE)
        try:
            style = get_style_by_name(style_name)
        except ClassNotFound:
            # Names Pygments does not know fall back to the bundled
            # Solarized style.
            style = solarized.SolarizedStyle

        wants_256 = is_windows or self.env.colors == 256
        formatter_cls = Terminal256Formatter if wants_256 else TerminalFormatter
        self.formatter = formatter_cls(style=style)

    def process_headers(self, headers):
        """Highlight `headers` using `HTTPLexer`."""
        http_lexer = HTTPLexer()
        return pygments.highlight(headers, http_lexer, self.formatter)

    def process_body(self, content, content_type):
        """Highlight `content` with the lexer registered for its mimetype.

        The content is returned unchanged when Pygments has no lexer for
        `content_type`.

        """
        try:
            body_lexer = get_lexer_for_mimetype(content_type)
        except ClassNotFound:
            return content
        return pygments.highlight(content, body_lexer, self.formatter)


class OutputProcessor(object):
    """Apply every enabled processor, in order, to headers and bodies."""

    # Processor classes to instantiate; they run in this order.
    installed_processors = [
        JSONProcessor,
        PygmentsProcessor
    ]

    def __init__(self, env, **kwargs):
        """Instantiate the installed processors and keep the enabled ones.

        `env` and `kwargs` are passed on to every processor class.

        """
        processors = [
            cls(env, **kwargs)
            for cls in self.installed_processors
        ]
        self.processors = [p for p in processors if p.enabled]

    def process_headers(self, headers):
        """Return `headers` after passing them through each processor."""
        for processor in self.processors:
            headers = processor.process_headers(headers)
        return headers

    def process_body(self, content, content_type):
        """Return `content` after passing it through each processor.

        `content_type` is the raw Content-Type header value. Before the
        processors see it, it is reduced to the bare media type, and
        `application/<anything>+json` / `+xml` types are simplified to
        `application/json` / `application/xml`.

        """
        # Drop parameters such as `; charset=utf-8`. Whitespace is allowed
        # around the `;` and media types are case-insensitive, so normalize
        # both; otherwise the comparisons done by the processors would miss
        # values like `application/json ; charset=utf-8`.
        content_type = content_type.split(';')[0].strip().lower()

        application_match = re.match(
            r'application/(.+\+)(json|xml)$',
            content_type
        )
        if application_match:
            # Strip vendor and extensions from Content-Type
            vendor = application_match.group(1)
            content_type = content_type.replace(vendor, '')

        for processor in self.processors:
            content = processor.process_body(content, content_type)

        return content
Added docstrings, refactored input. 2012-07-26 06:37:03 +02:00			`"""Output processing and formatting.`
Improved highlighting of HTTP headers. Closes #60. 2012-07-20 21:54:41 +02:00
			`"""`
Simplify vendor extension content-types since they are most likely lexable 2012-07-14 16:27:11 +02:00			`import re`
Initial commit. 2012-02-25 13:39:38 +01:00			`import json`
Clean-up 2012-07-26 00:26:23 +02:00
Initial commit. 2012-02-25 13:39:38 +01:00			`import pygments`
Improved highlighting of HTTP headers. Closes #60. 2012-07-20 21:54:41 +02:00			`from pygments import token, lexer`
PEP-8 2012-04-28 14:18:59 +02:00			`from pygments.styles import get_style_by_name, STYLE_MAP`
Improved highlighting of HTTP headers. Closes #60. 2012-07-20 21:54:41 +02:00			`from pygments.lexers import get_lexer_for_mimetype`
use PrettyHttp class; working --headers and --body 2012-04-28 14:13:40 +02:00			`from pygments.formatters.terminal import TerminalFormatter`
Improved highlighting of HTTP headers. Closes #60. 2012-07-20 21:54:41 +02:00			`from pygments.formatters.terminal256 import Terminal256Formatter`
			`from pygments.util import ClassNotFound`
Send filenames with multipart/form-data file uploads. 2012-07-28 13:24:44 +02:00			`from requests.compat import is_windows`
Clean-up 2012-07-26 00:26:23 +02:00
Added the option to print the request It is now possible to print any combination of the following request-response bits: - Request headers (H) - Request body (B) - Response headers (h) - Response body (b) The output is controlled by the --print / -p option which defaults to "hb" (i.e., response headers and response body). Note that -p was previously shortcut for --prety. Closes #29. 2012-03-14 00:05:44 +01:00			`from . import solarized`
Fixed multipart requests output; binary support. * Bodies of multipart requests are correctly printed (closes #30). * Binary requests and responses should always work (they are also suppressed for terminal output). So things like this work:: http www.google.com/favicon.ico > favicon.ico 2012-07-28 05:45:44 +02:00			`from .models import Environment`
Initial commit. 2012-02-25 13:39:38 +01:00
Improved highlighting of HTTP headers. Closes #60. 2012-07-20 21:54:41 +02:00
			`DEFAULT_STYLE = 'solarized'`
			`AVAILABLE_STYLES = [DEFAULT_STYLE] + list(STYLE_MAP.keys())`
Fixed multipart requests output; binary support. * Bodies of multipart requests are correctly printed (closes #30). * Binary requests and responses should always work (they are also suppressed for terminal output). So things like this work:: http www.google.com/favicon.ico > favicon.ico 2012-07-28 05:45:44 +02:00			`BINARY_SUPPRESSED_NOTICE = (`
			`'+-----------------------------------------+\n'`
			`'\| NOTE: binary data not shown in terminal \|\n'`
			`'+-----------------------------------------+'`
			`)`


			`def format(msg, prettifier=None, with_headers=True, with_body=True,`
			`env=Environment()):`
			"""Return a UTF8-encoded representation of a `models.HTTPMessage`.

Removed redundant decode/encode. 2012-07-29 03:52:24 +02:00			Sometimes the body contains binary data so we always return `bytes`.
Fixed multipart requests output; binary support. * Bodies of multipart requests are correctly printed (closes #30). * Binary requests and responses should always work (they are also suppressed for terminal output). So things like this work:: http www.google.com/favicon.ico > favicon.ico 2012-07-28 05:45:44 +02:00
Fixed typos. 2012-07-28 06:09:25 +02:00			If `prettifier` is set or the output is a terminal then a binary
			`body is not included in the output and is replaced with notice.`
Fixed multipart requests output; binary support. * Bodies of multipart requests are correctly printed (closes #30). * Binary requests and responses should always work (they are also suppressed for terminal output). So things like this work:: http www.google.com/favicon.ico > favicon.ico 2012-07-28 05:45:44 +02:00
Fixed typos. 2012-07-28 06:09:25 +02:00			Generally, when the `stdout` is redirected, the output matches the actual
			message as much as possible. When `--pretty` set (or implied),
Fixed multipart requests output; binary support. * Bodies of multipart requests are correctly printed (closes #30). * Binary requests and responses should always work (they are also suppressed for terminal output). So things like this work:: http www.google.com/favicon.ico > favicon.ico 2012-07-28 05:45:44 +02:00			`or when the output is a terminal, then we prefer readability over`
			`precision.`

			`"""`
Revorked output Binary now works everywhere. Also added `--output FILE` for Windows. 2012-07-30 10:58:16 +02:00
			`# Output encoding.`
			`if env.stdout_isatty:`
			`# Use encoding suitable for the terminal. Unsupported characters`
			`# will be replaced in the output.`
			`errors = 'replace'`
			`output_encoding = getattr(env.stdout, 'encoding', None)`
			`else:`
			`# Preserve the message encoding.`
			`errors = 'strict'`
			`output_encoding = msg.encoding`
			`if not output_encoding:`
			`# Default to utf8`
			`output_encoding = 'utf8'`

			`if prettifier:`
			`env.init_colors()`

			`#noinspection PyArgumentList`
			`output = bytearray()`
Fixed multipart requests output; binary support. * Bodies of multipart requests are correctly printed (closes #30). * Binary requests and responses should always work (they are also suppressed for terminal output). So things like this work:: http www.google.com/favicon.ico > favicon.ico 2012-07-28 05:45:44 +02:00
			`if with_headers:`
Removed redundant decode/encode. 2012-07-29 03:52:24 +02:00			`headers = '\n'.join([msg.line, msg.headers])`
Fixed multipart requests output; binary support. * Bodies of multipart requests are correctly printed (closes #30). * Binary requests and responses should always work (they are also suppressed for terminal output). So things like this work:: http www.google.com/favicon.ico > favicon.ico 2012-07-28 05:45:44 +02:00
			`if prettifier:`
Removed redundant decode/encode. 2012-07-29 03:52:24 +02:00			`headers = prettifier.process_headers(headers)`
Fixed multipart requests output; binary support. * Bodies of multipart requests are correctly printed (closes #30). * Binary requests and responses should always work (they are also suppressed for terminal output). So things like this work:: http www.google.com/favicon.ico > favicon.ico 2012-07-28 05:45:44 +02:00
Revorked output Binary now works everywhere. Also added `--output FILE` for Windows. 2012-07-30 10:58:16 +02:00			`output.extend(`
			`headers.encode(output_encoding, errors).strip())`
Fixed multipart requests output; binary support. * Bodies of multipart requests are correctly printed (closes #30). * Binary requests and responses should always work (they are also suppressed for terminal output). So things like this work:: http www.google.com/favicon.ico > favicon.ico 2012-07-28 05:45:44 +02:00
Revorked output Binary now works everywhere. Also added `--output FILE` for Windows. 2012-07-30 10:58:16 +02:00			`if with_body and msg.body:`
			`output.extend(b'\n\n')`
Fixed multipart requests output; binary support. * Bodies of multipart requests are correctly printed (closes #30). * Binary requests and responses should always work (they are also suppressed for terminal output). So things like this work:: http www.google.com/favicon.ico > favicon.ico 2012-07-28 05:45:44 +02:00
			`if with_body and msg.body:`

			`body = msg.body`

Revorked output Binary now works everywhere. Also added `--output FILE` for Windows. 2012-07-30 10:58:16 +02:00			`if not (env.stdout_isatty or prettifier):`
			`# Verbatim body even if it's binary.`
			`pass`
			`else:`
Fixed multipart requests output; binary support. * Bodies of multipart requests are correctly printed (closes #30). * Binary requests and responses should always work (they are also suppressed for terminal output). So things like this work:: http www.google.com/favicon.ico > favicon.ico 2012-07-28 05:45:44 +02:00			`try:`
Revorked output Binary now works everywhere. Also added `--output FILE` for Windows. 2012-07-30 10:58:16 +02:00			`body = body.decode(msg.encoding)`
Fixed multipart requests output; binary support. * Bodies of multipart requests are correctly printed (closes #30). * Binary requests and responses should always work (they are also suppressed for terminal output). So things like this work:: http www.google.com/favicon.ico > favicon.ico 2012-07-28 05:45:44 +02:00			`except UnicodeDecodeError:`
Revorked output Binary now works everywhere. Also added `--output FILE` for Windows. 2012-07-30 10:58:16 +02:00			`# Suppress binary data.`
			`body = BINARY_SUPPRESSED_NOTICE.encode(output_encoding)`
Fixed multipart requests output; binary support. * Bodies of multipart requests are correctly printed (closes #30). * Binary requests and responses should always work (they are also suppressed for terminal output). So things like this work:: http www.google.com/favicon.ico > favicon.ico 2012-07-28 05:45:44 +02:00			`if not with_headers:`
Revorked output Binary now works everywhere. Also added `--output FILE` for Windows. 2012-07-30 10:58:16 +02:00			`output.extend(b'\n')`
Fixed multipart requests output; binary support. * Bodies of multipart requests are correctly printed (closes #30). * Binary requests and responses should always work (they are also suppressed for terminal output). So things like this work:: http www.google.com/favicon.ico > favicon.ico 2012-07-28 05:45:44 +02:00			`else:`
Revorked output Binary now works everywhere. Also added `--output FILE` for Windows. 2012-07-30 10:58:16 +02:00			`if prettifier and msg.content_type:`
			`body = prettifier.process_body(`
			`body, msg.content_type).strip()`
Fixed multipart requests output; binary support. * Bodies of multipart requests are correctly printed (closes #30). * Binary requests and responses should always work (they are also suppressed for terminal output). So things like this work:: http www.google.com/favicon.ico > favicon.ico 2012-07-28 05:45:44 +02:00
Revorked output Binary now works everywhere. Also added `--output FILE` for Windows. 2012-07-30 10:58:16 +02:00			`body = body.encode(output_encoding, errors)`
Fixed multipart requests output; binary support. * Bodies of multipart requests are correctly printed (closes #30). * Binary requests and responses should always work (they are also suppressed for terminal output). So things like this work:: http www.google.com/favicon.ico > favicon.ico 2012-07-28 05:45:44 +02:00
Revorked output Binary now works everywhere. Also added `--output FILE` for Windows. 2012-07-30 10:58:16 +02:00			`output.extend(body)`
Fixed multipart requests output; binary support. * Bodies of multipart requests are correctly printed (closes #30). * Binary requests and responses should always work (they are also suppressed for terminal output). So things like this work:: http www.google.com/favicon.ico > favicon.ico 2012-07-28 05:45:44 +02:00
Revorked output Binary now works everywhere. Also added `--output FILE` for Windows. 2012-07-30 10:58:16 +02:00			`return bytes(output)`
Added support for terminal colors under Windows. Tested on Python 2.7 under Windows 7 with PowerShell and cmd.exe. Closes #36 2012-07-17 03:48:10 +02:00
Initial commit. 2012-02-25 13:39:38 +01:00
Improved highlighting of HTTP headers. Closes #60. 2012-07-20 21:54:41 +02:00			`class HTTPLexer(lexer.RegexLexer):`
Added docstrings, refactored input. 2012-07-26 06:37:03 +02:00			`"""Simplified HTTP lexer for Pygments.`
Improved highlighting of HTTP headers. Closes #60. 2012-07-20 21:54:41 +02:00
			`It only operates on headers and provides a stronger contrast between`
			`their names and values than the original one bundled with Pygments`
			(`pygments.lexers.text import HttpLexer`), especially when
			`Solarized color scheme is used.`

			`"""`
			`name = 'HTTP'`
			`aliases = ['http']`
			`filenames = ['*.http']`
			`tokens = {`
			`'root': [`
Initial commit. 2012-02-25 13:39:38 +01:00
Improved highlighting of HTTP headers. Closes #60. 2012-07-20 21:54:41 +02:00			`# Request-Line`
			`(r'([A-Z]+)( +)([^ ]+)( +)(HTTP)(/)(\d+\.\d+)',`
			`lexer.bygroups(`
			`token.Name.Function,`
			`token.Text,`
			`token.Name.Namespace,`
			`token.Text,`
			`token.Keyword.Reserved,`
			`token.Operator,`
			`token.Number`
			`)),`

			`# Response Status-Line`
			`(r'(HTTP)(/)(\d+\.\d+)( +)(\d{3})( +)(.+)',`
			`lexer.bygroups(`
			`token.Keyword.Reserved, # 'HTTP'`
			`token.Operator, # '/'`
			`token.Number, # Version`
			`token.Text,`
			`token.Number, # Status code`
			`token.Text,`
			`token.Name.Exception, # Reason`
			`)),`

			`# Header`
			`(r'(.?)( )(:)( *)(.+)', lexer.bygroups(`
			`token.Name.Attribute, # Name`
			`token.Text,`
			`token.Operator, # Colon`
			`token.Text,`
			`token.String # Value`
			`))`
			`]}`
Simplify vendor extension content-types since they are most likely lexable 2012-07-14 16:27:11 +02:00
Use the Pygments HTTP and JSON lexers 2012-04-26 13:05:59 +02:00
Added `models.Environment()`. Refactoring and general cleanup. 2012-07-21 02:59:43 +02:00			`class BaseProcessor(object):`

			`enabled = True`

			`def __init__(self, env, **kwargs):`
			`self.env = env`
			`self.kwargs = kwargs`

			`def process_headers(self, headers):`
			`return headers`

			`def process_body(self, content, content_type):`
			`return content`


			`class JSONProcessor(BaseProcessor):`

			`def process_body(self, content, content_type):`
			`if content_type == 'application/json':`
			`try:`
			`# Indent and sort the JSON data.`
			`content = json.dumps(`
			`json.loads(content),`
			`sort_keys=True,`
			`ensure_ascii=False,`
			`indent=4,`
			`)`
			`except ValueError:`
			`# Invalid JSON - we don't care.`
			`pass`
			`return content`


			`class PygmentsProcessor(BaseProcessor):`

			`def __init__(self, args, *kwargs):`
			`super(PygmentsProcessor, self).__init__(args, *kwargs)`

			`if not self.env.colors:`
			`self.enabled = False`
			`return`
use PrettyHttp class; working --headers and --body 2012-04-28 14:13:40 +02:00
Improved highlighting of HTTP headers. Closes #60. 2012-07-20 21:54:41 +02:00			`try:`
Added `models.Environment()`. Refactoring and general cleanup. 2012-07-21 02:59:43 +02:00			`style = get_style_by_name(`
			`self.kwargs.get('pygments_style', DEFAULT_STYLE))`
Improved highlighting of HTTP headers. Closes #60. 2012-07-20 21:54:41 +02:00			`except ClassNotFound:`
			`style = solarized.SolarizedStyle`
use PrettyHttp class; working --headers and --body 2012-04-28 14:13:40 +02:00
Added `models.Environment()`. Refactoring and general cleanup. 2012-07-21 02:59:43 +02:00			`if is_windows or self.env.colors == 256:`
			`fmt_class = Terminal256Formatter`
			`else:`
			`fmt_class = TerminalFormatter`
			`self.formatter = fmt_class(style=style)`
use PrettyHttp class; working --headers and --body 2012-04-28 14:13:40 +02:00
Added `models.Environment()`. Refactoring and general cleanup. 2012-07-21 02:59:43 +02:00			`def process_headers(self, headers):`
			`return pygments.highlight(`
			`headers, HTTPLexer(), self.formatter)`
Improved highlighting of HTTP headers. Closes #60. 2012-07-20 21:54:41 +02:00
Added `models.Environment()`. Refactoring and general cleanup. 2012-07-21 02:59:43 +02:00			`def process_body(self, content, content_type):`
			`try:`
			`lexer = get_lexer_for_mimetype(content_type)`
			`except ClassNotFound:`
			`pass`
			`else:`
			`content = pygments.highlight(content, lexer, self.formatter)`
			`return content`


			`class OutputProcessor(object):`

			`installed_processors = [`
			`JSONProcessor,`
			`PygmentsProcessor`
			`]`

			`def __init__(self, env, **kwargs):`
			`processors = [`
			`cls(env, **kwargs)`
			`for cls in self.installed_processors`
			`]`
			`self.processors = [p for p in processors if p.enabled]`

			`def process_headers(self, headers):`
			`for processor in self.processors:`
			`headers = processor.process_headers(headers)`
			`return headers`

			`def process_body(self, content, content_type):`
use PrettyHttp class; working --headers and --body 2012-04-28 14:13:40 +02:00			`content_type = content_type.split(';')[0]`
Improved highlighting of HTTP headers. Closes #60. 2012-07-20 21:54:41 +02:00
			`application_match = re.match(`
			`r'application/(.+\+)(json\|xml)$',`
			`content_type`
			`)`
Simplify vendor extension content-types since they are most likely lexable 2012-07-14 16:27:11 +02:00			`if application_match:`
			`# Strip vendor and extensions from Content-Type`
			`vendor, extension = application_match.groups()`
Python 3 fixes. 2012-07-17 01:26:21 +02:00			`content_type = content_type.replace(vendor, '')`
Simplify vendor extension content-types since they are most likely lexable 2012-07-14 16:27:11 +02:00
Added `models.Environment()`. Refactoring and general cleanup. 2012-07-21 02:59:43 +02:00			`for processor in self.processors:`
			`content = processor.process_body(content, content_type)`
Use the Pygments HTTP and JSON lexers 2012-04-26 13:05:59 +02:00
Added `models.Environment()`. Refactoring and general cleanup. 2012-07-21 02:59:43 +02:00			`return content`