File: test_line_ending.py

package info (click to toggle)
dulwich 1.0.0-2
links: PTS, VCS
area: main
in suites: sid
size: 7,388 kB
sloc: python: 99,991; makefile: 163; sh: 67
file content (690 lines) | stat: -rw-r--r-- 25,662 bytes
parent folder | download | duplicates (2)
# test_line_ending.py -- Tests for the line ending functions
# Copyright (C) 2018-2019 Boris Feld <boris.feld@comet.ml>
#
# SPDX-License-Identifier: Apache-2.0 OR GPL-2.0-or-later
# Dulwich is dual-licensed under the Apache License, Version 2.0 and the GNU
# General Public License as published by the Free Software Foundation; version 2.0
# or (at your option) any later version. You can redistribute it and/or
# modify it under the terms of either of these two licenses.
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
# You should have received a copy of the licenses; if not, see
# <http://www.gnu.org/licenses/> for a copy of the GNU General Public License
# and <http://www.apache.org/licenses/LICENSE-2.0> for a copy of the Apache
# License, Version 2.0.
#

"""Tests for the line ending conversion."""

from dulwich.line_ending import (
    BlobNormalizer,
    LineEndingFilter,
    TreeBlobNormalizer,
    check_safecrlf,
    convert_crlf_to_lf,
    convert_lf_to_crlf,
    get_clean_filter_autocrlf,
    get_smudge_filter_autocrlf,
    normalize_blob,
)
from dulwich.objects import Blob

from . import TestCase


class LineEndingConversion(TestCase):
    """Test the line ending conversion functions in various cases."""

    def test_convert_crlf_to_lf_no_op(self) -> None:
        self.assertEqual(convert_crlf_to_lf(b"foobar"), b"foobar")

    def test_convert_crlf_to_lf(self) -> None:
        self.assertEqual(convert_crlf_to_lf(b"line1\r\nline2"), b"line1\nline2")

    def test_convert_crlf_to_lf_mixed(self) -> None:
        self.assertEqual(convert_crlf_to_lf(b"line1\r\n\nline2"), b"line1\n\nline2")

    def test_convert_lf_to_crlf_no_op(self) -> None:
        self.assertEqual(convert_lf_to_crlf(b"foobar"), b"foobar")

    def test_convert_lf_to_crlf(self) -> None:
        self.assertEqual(convert_lf_to_crlf(b"line1\nline2"), b"line1\r\nline2")

    def test_convert_lf_to_crlf_mixed(self) -> None:
        self.assertEqual(convert_lf_to_crlf(b"line1\r\n\nline2"), b"line1\r\n\r\nline2")


class GetLineEndingAutocrlfFilters(TestCase):
    def test_get_clean_filter_autocrlf_default(self) -> None:
        clean_filter = get_clean_filter_autocrlf(b"false")

        self.assertEqual(clean_filter, None)

    def test_get_clean_filter_autocrlf_true(self) -> None:
        clean_filter = get_clean_filter_autocrlf(b"true")

        self.assertEqual(clean_filter, convert_crlf_to_lf)

    def test_get_clean_filter_autocrlf_input(self) -> None:
        clean_filter = get_clean_filter_autocrlf(b"input")

        self.assertEqual(clean_filter, convert_crlf_to_lf)

    def test_get_smudge_filter_autocrlf_default(self) -> None:
        smudge_filter = get_smudge_filter_autocrlf(b"false")

        self.assertEqual(smudge_filter, None)

    def test_get_smudge_filter_autocrlf_true(self) -> None:
        smudge_filter = get_smudge_filter_autocrlf(b"true")

        self.assertEqual(smudge_filter, convert_lf_to_crlf)

    def test_get_smudge_filter_autocrlf_input(self) -> None:
        smudge_filter = get_smudge_filter_autocrlf(b"input")

        self.assertEqual(smudge_filter, None)


class NormalizeBlobTestCase(TestCase):
    def test_normalize_to_lf_no_op(self) -> None:
        base_content = b"line1\nline2"
        base_sha = "f8be7bb828880727816015d21abcbc37d033f233"

        base_blob = Blob()
        base_blob.set_raw_string(base_content)

        self.assertEqual(base_blob.as_raw_chunks(), [base_content])
        self.assertEqual(base_blob.sha().hexdigest(), base_sha)

        filtered_blob = normalize_blob(
            base_blob, convert_crlf_to_lf, binary_detection=False
        )

        self.assertEqual(filtered_blob.as_raw_chunks(), [base_content])
        self.assertEqual(filtered_blob.sha().hexdigest(), base_sha)

    def test_normalize_to_lf(self) -> None:
        base_content = b"line1\r\nline2"
        base_sha = "3a1bd7a52799fe5cf6411f1d35f4c10bacb1db96"

        base_blob = Blob()
        base_blob.set_raw_string(base_content)

        self.assertEqual(base_blob.as_raw_chunks(), [base_content])
        self.assertEqual(base_blob.sha().hexdigest(), base_sha)

        filtered_blob = normalize_blob(
            base_blob, convert_crlf_to_lf, binary_detection=False
        )

        normalized_content = b"line1\nline2"
        normalized_sha = "f8be7bb828880727816015d21abcbc37d033f233"

        self.assertEqual(filtered_blob.as_raw_chunks(), [normalized_content])
        self.assertEqual(filtered_blob.sha().hexdigest(), normalized_sha)

    def test_normalize_to_lf_binary(self) -> None:
        base_content = b"line1\r\nline2\0"
        base_sha = "b44504193b765f7cd79673812de8afb55b372ab2"

        base_blob = Blob()
        base_blob.set_raw_string(base_content)

        self.assertEqual(base_blob.as_raw_chunks(), [base_content])
        self.assertEqual(base_blob.sha().hexdigest(), base_sha)

        filtered_blob = normalize_blob(
            base_blob, convert_crlf_to_lf, binary_detection=True
        )

        self.assertEqual(filtered_blob.as_raw_chunks(), [base_content])
        self.assertEqual(filtered_blob.sha().hexdigest(), base_sha)

    def test_normalize_to_crlf_no_op(self) -> None:
        base_content = b"line1\r\nline2"
        base_sha = "3a1bd7a52799fe5cf6411f1d35f4c10bacb1db96"

        base_blob = Blob()
        base_blob.set_raw_string(base_content)

        self.assertEqual(base_blob.as_raw_chunks(), [base_content])
        self.assertEqual(base_blob.sha().hexdigest(), base_sha)

        filtered_blob = normalize_blob(
            base_blob, convert_lf_to_crlf, binary_detection=False
        )

        self.assertEqual(filtered_blob.as_raw_chunks(), [base_content])
        self.assertEqual(filtered_blob.sha().hexdigest(), base_sha)

    def test_normalize_to_crlf(self) -> None:
        base_content = b"line1\nline2"
        base_sha = "f8be7bb828880727816015d21abcbc37d033f233"

        base_blob = Blob()
        base_blob.set_raw_string(base_content)

        self.assertEqual(base_blob.as_raw_chunks(), [base_content])
        self.assertEqual(base_blob.sha().hexdigest(), base_sha)

        filtered_blob = normalize_blob(
            base_blob, convert_lf_to_crlf, binary_detection=False
        )

        normalized_content = b"line1\r\nline2"
        normalized_sha = "3a1bd7a52799fe5cf6411f1d35f4c10bacb1db96"

        self.assertEqual(filtered_blob.as_raw_chunks(), [normalized_content])
        self.assertEqual(filtered_blob.sha().hexdigest(), normalized_sha)

    def test_normalize_to_crlf_binary(self) -> None:
        base_content = b"line1\r\nline2\0"
        base_sha = "b44504193b765f7cd79673812de8afb55b372ab2"

        base_blob = Blob()
        base_blob.set_raw_string(base_content)

        self.assertEqual(base_blob.as_raw_chunks(), [base_content])
        self.assertEqual(base_blob.sha().hexdigest(), base_sha)

        filtered_blob = normalize_blob(
            base_blob, convert_lf_to_crlf, binary_detection=True
        )

        self.assertEqual(filtered_blob.as_raw_chunks(), [base_content])
        self.assertEqual(filtered_blob.sha().hexdigest(), base_sha)


class LineEndingFilterTests(TestCase):
    """Test the LineEndingFilter class."""

    def test_clean_no_conversion(self) -> None:
        """Test clean with no conversion function."""
        filter = LineEndingFilter()
        data = b"test\r\ndata"
        self.assertEqual(filter.clean(data), data)

    def test_clean_with_conversion(self) -> None:
        """Test clean with CRLF to LF conversion."""
        filter = LineEndingFilter(clean_conversion=convert_crlf_to_lf)
        data = b"test\r\ndata"
        self.assertEqual(filter.clean(data), b"test\ndata")

    def test_clean_binary_detection(self) -> None:
        """Test clean skips binary files."""
        filter = LineEndingFilter(
            clean_conversion=convert_crlf_to_lf, binary_detection=True
        )
        # Binary data with null byte
        data = b"test\r\n\x00data"
        self.assertEqual(filter.clean(data), data)  # Should not convert

    def test_smudge_no_conversion(self) -> None:
        """Test smudge with no conversion function."""
        filter = LineEndingFilter()
        data = b"test\ndata"
        self.assertEqual(filter.smudge(data), data)

    def test_smudge_with_conversion(self) -> None:
        """Test smudge with LF to CRLF conversion."""
        filter = LineEndingFilter(smudge_conversion=convert_lf_to_crlf)
        data = b"test\ndata"
        self.assertEqual(filter.smudge(data), b"test\r\ndata")

    def test_smudge_binary_detection(self) -> None:
        """Test smudge skips binary files."""
        filter = LineEndingFilter(
            smudge_conversion=convert_lf_to_crlf, binary_detection=True
        )
        # Binary data with null byte
        data = b"test\n\x00data"
        self.assertEqual(filter.smudge(data), data)  # Should not convert


class BlobNormalizerTests(TestCase):
    """Test the BlobNormalizer class integration with filters."""

    def setUp(self) -> None:
        super().setUp()
        from dulwich.config import ConfigDict

        self.config = ConfigDict()
        self.gitattributes = {}

    def test_autocrlf_true_checkin(self) -> None:
        """Test checkin with autocrlf=true."""
        normalizer = BlobNormalizer(self.config, self.gitattributes, autocrlf=b"true")

        # Create blob with CRLF
        blob = Blob()
        blob.data = b"line1\r\nline2\r\n"

        # Should convert to LF on checkin
        result = normalizer.checkin_normalize(blob, b"test.txt")
        self.assertEqual(result.data, b"line1\nline2\n")

    def test_autocrlf_true_checkout(self) -> None:
        """Test checkout with autocrlf=true."""
        normalizer = BlobNormalizer(self.config, self.gitattributes, autocrlf=b"true")

        # Create blob with LF
        blob = Blob()
        blob.data = b"line1\nline2\n"

        # Should convert to CRLF on checkout
        result = normalizer.checkout_normalize(blob, b"test.txt")
        self.assertEqual(result.data, b"line1\r\nline2\r\n")

    def test_autocrlf_input_checkin(self) -> None:
        """Test checkin with autocrlf=input."""
        normalizer = BlobNormalizer(self.config, self.gitattributes, autocrlf=b"input")

        # Create blob with CRLF
        blob = Blob()
        blob.data = b"line1\r\nline2\r\n"

        # Should convert to LF on checkin
        result = normalizer.checkin_normalize(blob, b"test.txt")
        self.assertEqual(result.data, b"line1\nline2\n")

    def test_autocrlf_input_checkout(self) -> None:
        """Test checkout with autocrlf=input."""
        normalizer = BlobNormalizer(self.config, self.gitattributes, autocrlf=b"input")

        # Create blob with LF
        blob = Blob()
        blob.data = b"line1\nline2\n"

        # Should NOT convert on checkout with input mode
        result = normalizer.checkout_normalize(blob, b"test.txt")
        self.assertIs(result, blob)  # Same object, no conversion

    def test_autocrlf_false(self) -> None:
        """Test with autocrlf=false (no conversion)."""
        normalizer = BlobNormalizer(self.config, self.gitattributes, autocrlf=b"false")

        # Create blob with mixed line endings
        blob = Blob()
        blob.data = b"line1\r\nline2\nline3"

        # Should not convert on either operation
        result = normalizer.checkin_normalize(blob, b"test.txt")
        self.assertIs(result, blob)

        result = normalizer.checkout_normalize(blob, b"test.txt")
        self.assertIs(result, blob)

    def test_gitattributes_text_attr(self) -> None:
        """Test gitattributes text attribute overrides autocrlf."""
        # Set gitattributes to force text conversion
        self.gitattributes[b"*.txt"] = {b"text": True}

        # Even with autocrlf=false, should convert based on gitattributes
        normalizer = BlobNormalizer(self.config, self.gitattributes, autocrlf=b"false")

        blob = Blob()
        blob.data = b"line1\r\nline2\r\n"

        # Should still convert because of gitattributes
        result = normalizer.checkin_normalize(blob, b"test.txt")
        # Note: with just text=true and no eol setting, it follows platform defaults
        # For checkin, it should always normalize to LF
        self.assertIsNot(result, blob)

    def test_gitattributes_binary_attr(self) -> None:
        """Test gitattributes -text attribute prevents conversion."""
        # Set gitattributes to force binary (no conversion)
        self.gitattributes[b"*.bin"] = {b"text": False}

        normalizer = BlobNormalizer(self.config, self.gitattributes, autocrlf=b"true")

        blob = Blob()
        blob.data = b"line1\r\nline2\r\n"

        # Should not convert despite autocrlf=true
        result = normalizer.checkin_normalize(blob, b"test.bin")
        self.assertIs(result, blob)

    def test_binary_file_detection(self) -> None:
        """Test that binary files are not converted."""
        normalizer = BlobNormalizer(self.config, self.gitattributes, autocrlf=b"true")

        # Create blob with binary content
        blob = Blob()
        blob.data = b"line1\r\n\x00\xffbinary\r\ndata"

        # Should not convert binary files
        result = normalizer.checkin_normalize(blob, b"binary.dat")
        self.assertIs(result, blob)

        result = normalizer.checkout_normalize(blob, b"binary.dat")
        self.assertIs(result, blob)


class TreeBlobNormalizerTests(TestCase):
    """Test the TreeBlobNormalizer class for existing file handling."""

    def setUp(self) -> None:
        super().setUp()
        from dulwich.config import ConfigDict
        from dulwich.object_store import MemoryObjectStore

        self.config = ConfigDict()
        self.gitattributes = {}
        self.object_store = MemoryObjectStore()

    def test_autocrlf_input_existing_files(self) -> None:
        """Test that autocrlf=input normalizes existing files with CRLF."""
        # Create a tree with an existing file
        from dulwich.objects import Tree

        tree = Tree()
        tree[b"existing.txt"] = (0o100644, b"a" * 40)  # dummy sha
        self.object_store.add_object(tree)

        # Create normalizer with autocrlf=input
        normalizer = TreeBlobNormalizer(
            self.config,
            self.gitattributes,
            self.object_store,
            tree.id,
            autocrlf=b"input",
        )

        # Create blob with CRLF line endings
        blob = Blob()
        blob.data = b"line1\r\nline2\r\n"

        # Should convert CRLF to LF on checkin even for existing files
        result = normalizer.checkin_normalize(blob, b"existing.txt")
        self.assertEqual(result.data, b"line1\nline2\n")

    def test_autocrlf_false_existing_files(self) -> None:
        """Test that autocrlf=false does not normalize existing files."""
        # Create a tree with an existing file
        from dulwich.objects import Tree

        tree = Tree()
        tree[b"existing.txt"] = (0o100644, b"a" * 40)  # dummy sha
        self.object_store.add_object(tree)

        # Create normalizer with autocrlf=false
        normalizer = TreeBlobNormalizer(
            self.config,
            self.gitattributes,
            self.object_store,
            tree.id,
            autocrlf=b"false",
        )

        # Create blob with CRLF line endings
        blob = Blob()
        blob.data = b"line1\r\nline2\r\n"

        # Should NOT convert for existing files when autocrlf=false
        result = normalizer.checkin_normalize(blob, b"existing.txt")
        self.assertIs(result, blob)

    def test_autocrlf_input_new_files(self) -> None:
        """Test that autocrlf=input normalizes new files."""
        # Create empty tree (no existing files)
        from dulwich.objects import Tree

        tree = Tree()
        self.object_store.add_object(tree)

        # Create normalizer with autocrlf=input
        normalizer = TreeBlobNormalizer(
            self.config,
            self.gitattributes,
            self.object_store,
            tree.id,
            autocrlf=b"input",
        )

        # Create blob with CRLF line endings
        blob = Blob()
        blob.data = b"line1\r\nline2\r\n"

        # Should convert CRLF to LF for new files
        result = normalizer.checkin_normalize(blob, b"new.txt")
        self.assertEqual(result.data, b"line1\nline2\n")


class LineEndingIntegrationTests(TestCase):
    """Integration tests for line ending conversion with the filter system."""

    def setUp(self) -> None:
        super().setUp()
        from dulwich.config import ConfigDict
        from dulwich.filters import FilterRegistry

        self.config = ConfigDict()
        self.registry = FilterRegistry(self.config)

    def test_filter_registry_with_line_endings(self) -> None:
        """Test that line ending filters work through the registry."""
        # Register a custom text filter that does line ending conversion
        filter = LineEndingFilter(
            clean_conversion=convert_crlf_to_lf,
            smudge_conversion=convert_lf_to_crlf,
            binary_detection=True,
        )
        self.registry.register_driver("text", filter)

        # Set up gitattributes
        # Create GitAttributes
        from dulwich.attrs import GitAttributes, Pattern

        patterns = [(Pattern(b"*.txt"), {b"filter": b"text"})]
        gitattributes = GitAttributes(patterns)

        # Create normalizer
        from dulwich.filters import FilterBlobNormalizer, FilterContext

        filter_context = FilterContext(self.registry)
        normalizer = FilterBlobNormalizer(
            self.config, gitattributes, filter_context=filter_context
        )

        # Test round trip
        blob = Blob()
        blob.data = b"Hello\r\nWorld\r\n"

        # Checkin should convert CRLF to LF
        checked_in = normalizer.checkin_normalize(blob, b"test.txt")
        self.assertEqual(checked_in.data, b"Hello\nWorld\n")

        # Checkout should convert LF to CRLF
        checked_out = normalizer.checkout_normalize(checked_in, b"test.txt")
        self.assertEqual(checked_out.data, b"Hello\r\nWorld\r\n")

    def test_mixed_filters(self) -> None:
        """Test multiple filters can coexist (line endings and LFS)."""
        # This would be a more complex test requiring LFS setup
        # For now, just verify the structure works
        text_filter = LineEndingFilter(
            clean_conversion=convert_crlf_to_lf,
            smudge_conversion=convert_lf_to_crlf,
        )
        self.registry.register_driver("text", text_filter)

        # Mock LFS filter
        class MockLFSFilter:
            def clean(self, data):
                return b"LFS pointer"

            def smudge(self, data):
                return b"LFS content"

            def cleanup(self):
                pass

            def reuse(self, config, filter_name):
                return False

        self.registry.register_driver("lfs", MockLFSFilter())

        # Different files use different filters
        from dulwich.attrs import GitAttributes, Pattern

        patterns = [
            (Pattern(b"*.txt"), {b"filter": b"text"}),
            (Pattern(b"*.bin"), {b"filter": b"lfs"}),
        ]
        gitattributes = GitAttributes(patterns)

        from dulwich.filters import FilterBlobNormalizer, FilterContext

        filter_context = FilterContext(self.registry)
        normalizer = FilterBlobNormalizer(
            self.config, gitattributes, filter_context=filter_context
        )

        # Text file gets line ending conversion
        text_blob = Blob()
        text_blob.data = b"text\r\nfile"
        result = normalizer.checkin_normalize(text_blob, b"test.txt")
        self.assertEqual(result.data, b"text\nfile")

        # Binary file gets LFS conversion
        bin_blob = Blob()
        bin_blob.data = b"binary content"
        result = normalizer.checkin_normalize(bin_blob, b"test.bin")
        self.assertEqual(result.data, b"LFS pointer")


class LineEndingFilterFromConfigTests(TestCase):
    """Test LineEndingFilter.from_config classmethod."""

    def test_from_config_none(self) -> None:
        """Test from_config with no config."""
        # No config, not for text attr - no conversion
        filter = LineEndingFilter.from_config(None, for_text_attr=False)
        self.assertIsNone(filter.clean_conversion)
        self.assertIsNone(filter.smudge_conversion)
        self.assertEqual(filter.safecrlf, b"false")

        # No config, for text attr - normalize on checkin
        filter = LineEndingFilter.from_config(None, for_text_attr=True)
        self.assertIsNotNone(filter.clean_conversion)
        self.assertIsNone(filter.smudge_conversion)
        self.assertEqual(filter.safecrlf, b"false")

    def test_from_config_autocrlf_true(self) -> None:
        """Test from_config with autocrlf=true."""
        from dulwich.config import ConfigDict

        config = ConfigDict()
        config.set(b"core", b"autocrlf", b"true")

        filter = LineEndingFilter.from_config(config, for_text_attr=False)
        self.assertIsNotNone(filter.clean_conversion)
        self.assertIsNotNone(filter.smudge_conversion)
        self.assertEqual(filter.safecrlf, b"false")

    def test_from_config_with_safecrlf(self) -> None:
        """Test from_config with safecrlf setting."""
        from dulwich.config import ConfigDict

        config = ConfigDict()
        config.set(b"core", b"autocrlf", b"input")
        config.set(b"core", b"safecrlf", b"warn")

        filter = LineEndingFilter.from_config(config, for_text_attr=False)
        self.assertIsNotNone(filter.clean_conversion)
        self.assertIsNone(filter.smudge_conversion)
        self.assertEqual(filter.safecrlf, b"warn")

    def test_from_config_text_attr_overrides(self) -> None:
        """Test that for_text_attr=True always normalizes on checkin."""
        from dulwich.config import ConfigDict

        config = ConfigDict()
        config.set(b"core", b"autocrlf", b"false")

        # Even with autocrlf=false, text attr should normalize
        filter = LineEndingFilter.from_config(config, for_text_attr=True)
        self.assertIsNotNone(filter.clean_conversion)
        # Smudge should still be None since autocrlf=false
        self.assertIsNone(filter.smudge_conversion)


class SafeCRLFTests(TestCase):
    """Test core.safecrlf functionality."""

    def test_safecrlf_false(self) -> None:
        """Test that safecrlf=false allows any conversion."""
        original = b"line1\r\nline2\r\n"
        converted = b"line1\nline2\n"
        # Should not raise
        check_safecrlf(original, converted, b"false", b"test.txt")

    def test_safecrlf_true_safe_conversion(self) -> None:
        """Test that safecrlf=true allows safe conversions."""
        # CRLF -> LF -> CRLF is reversible
        original = b"line1\r\nline2\r\n"
        converted = b"line1\nline2\n"
        # Should not raise because conversion is reversible
        check_safecrlf(original, converted, b"true", b"test.txt")

    def test_safecrlf_true_unsafe_conversion(self) -> None:
        """Test that safecrlf=true fails on unsafe conversions."""
        # Mixed line endings would be lost
        original = b"line1\r\nline2\nline3\r\n"
        converted = b"line1\nline2\nline3\n"
        # Should raise because converting back gives all CRLF
        with self.assertRaises(ValueError) as cm:
            check_safecrlf(original, converted, b"true", b"test.txt")
        self.assertIn("CRLF would be replaced by LF", str(cm.exception))

    def test_safecrlf_warn(self) -> None:
        """Test that safecrlf=warn issues warnings."""
        # Mixed line endings would be lost
        original = b"line1\r\nline2\nline3\r\n"
        converted = b"line1\nline2\nline3\n"
        # Should warn but not raise
        with self.assertLogs("dulwich.line_ending", level="WARNING") as cm:
            check_safecrlf(original, converted, b"warn", b"test.txt")
            self.assertEqual(len(cm.output), 1)
            self.assertIn("CRLF would be replaced by LF", cm.output[0])

    def test_lineending_filter_with_safecrlf(self) -> None:
        """Test LineEndingFilter with safecrlf enabled."""
        # Test with safecrlf=true
        filter_strict = LineEndingFilter(
            clean_conversion=convert_crlf_to_lf,
            smudge_conversion=None,
            binary_detection=False,
            safecrlf=b"true",
        )

        # Safe conversion should work
        safe_data = b"line1\r\nline2\r\n"
        result = filter_strict.clean(safe_data, b"test.txt")
        self.assertEqual(result, b"line1\nline2\n")

        # Unsafe conversion should fail
        unsafe_data = b"line1\r\nline2\nline3\r\n"
        with self.assertRaises(ValueError):
            filter_strict.clean(unsafe_data, b"test.txt")

        # Test with safecrlf=warn
        filter_warn = LineEndingFilter(
            clean_conversion=convert_crlf_to_lf,
            smudge_conversion=None,
            binary_detection=False,
            safecrlf=b"warn",
        )

        # Should warn but still convert
        with self.assertLogs("dulwich.line_ending", level="WARNING") as cm:
            result = filter_warn.clean(unsafe_data, b"test.txt")
            self.assertEqual(result, b"line1\nline2\nline3\n")
            self.assertEqual(len(cm.output), 1)