File: test_extractoutput.py

package info (click to toggle)
nbconvert 7.17.0-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 3,056 kB
  • sloc: python: 8,449; makefile: 199; javascript: 2
file content (86 lines) | stat: -rw-r--r-- 3,219 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
"""Tests for the extractoutput preprocessor"""

# Copyright (c) IPython Development Team.
# Distributed under the terms of the Modified BSD License.

import json

from nbconvert.preprocessors.extractoutput import ExtractOutputPreprocessor

from .base import PreprocessorTestsBase


class TestExtractOutput(PreprocessorTestsBase):
    """Test cases exercising the ExtractOutputPreprocessor."""

    def build_preprocessor(self):
        """Return an enabled preprocessor that extracts text, png and pdf outputs."""
        extractor = ExtractOutputPreprocessor()
        extractor.extract_output_types = {"text/plain", "image/png", "application/pdf"}
        extractor.enabled = True
        return extractor

    def test_constructor(self):
        """Can an ExtractOutputPreprocessor be constructed?"""
        self.build_preprocessor()

    def test_output(self):
        """Check that text, png and pdf outputs are extracted into the resources."""
        notebook = self.build_notebook()
        resources = self.build_resources()
        extractor = self.build_preprocessor()
        notebook, resources = extractor(notebook, resources)

        # (index of the output in the first cell, mime type, bytes expected
        # under the extracted filename in resources["outputs"])
        expectations = (
            (1, "text/plain", b"b"),
            (6, "image/png", b"g"),
            (7, "application/pdf", b"h"),
        )

        # First pass: every targeted output must carry a filename for its
        # mime type in its metadata.
        extracted_names = {}
        for index, mime_type, _ in expectations:
            metadata = notebook.cells[0].outputs[index].metadata
            self.assertIn("filenames", metadata)
            self.assertIn(mime_type, metadata.filenames)
            extracted_names[mime_type] = metadata.filenames[mime_type]

        # Second pass: each recorded filename must map to the expected bytes.
        for _, mime_type, payload in expectations:
            filename = extracted_names[mime_type]
            self.assertIn(filename, resources["outputs"])
            self.assertEqual(resources["outputs"][filename], payload)

    def test_json_extraction(self):
        """Check extraction when only application/json outputs are requested."""
        notebook = self.build_notebook(with_json_outputs=True)
        resources = self.build_resources()
        extractor = self.build_preprocessor()
        extractor.extract_output_types = {"application/json"}
        notebook, resources = extractor(notebook, resources)
        # A freshly built notebook serves as the unprocessed reference.
        reference = self.build_notebook(with_json_outputs=True).cells[0].outputs

        # Verify cell untouched
        processed_data = [out.get("data") for out in notebook.cells[0].outputs]
        reference_data = [out.get("data") for out in reference]
        self.assertEqual(processed_data, reference_data)

        # Serialize each JSON payload of the reference outputs; outputs
        # lacking a "data" or "application/json" entry are skipped.
        expected_files = []
        for out in reference:
            try:
                payload = out["data"]["application/json"]
            except KeyError:
                continue
            expected_files.append(json.dumps(payload).encode())

        # Verify equivalence of extracted outputs.
        self.assertEqual(sorted(resources["outputs"].values()), sorted(expected_files))