mattermost/server/platform/services/docextractor/archive_test.go
Christopher Poile fb11968f87
[MM-65701] Fix for docextractor archive handling (#34983)
* do not attempt to decompress 7zip files in docextractor

* use SevenZip.Match to detect a 7z file instead of our own method

* merge conflicts

---------

Co-authored-by: Mattermost Build <build@mattermost.com>
2026-03-25 19:17:33 +00:00

52 lines
2 KiB
Go

// Copyright (c) 2015-present Mattermost, Inc. All Rights Reserved.
// See LICENSE.txt for license information.
package docextractor
import (
"bytes"
"testing"
"github.com/stretchr/testify/assert"
"github.com/stretchr/testify/require"
)
func TestArchiveExtractorSkips7zip(t *testing.T) {
ae := &archiveExtractor{}
t.Run("7zip file with .7z extension returns empty string", func(t *testing.T) {
// Valid 7zip header (minimal)
sevenZipData := []byte{0x37, 0x7a, 0xbc, 0xaf, 0x27, 0x1c, 0x00, 0x00}
result, err := ae.Extract("test.7z", bytes.NewReader(sevenZipData), 0)
require.NoError(t, err)
assert.Empty(t, result)
})
t.Run("7zip content with wrong extension is still blocked", func(t *testing.T) {
// 7zip content disguised with .zip extension - should still be blocked via stream detection
sevenZipData := []byte{0x37, 0x7a, 0xbc, 0xaf, 0x27, 0x1c, 0x00, 0x00}
result, err := ae.Extract("malicious.zip", bytes.NewReader(sevenZipData), 0)
require.NoError(t, err)
assert.Empty(t, result)
})
t.Run("7zip at offset with .7z extension is blocked via filename", func(t *testing.T) {
junkPrefix := []byte{0x00, 0x00, 0x00, 0x00}
sevenZipSig := []byte{0x37, 0x7a, 0xbc, 0xaf, 0x27, 0x1c, 0x00, 0x00}
dataWithOffset := append(junkPrefix, sevenZipSig...)
result, err := ae.Extract("test.7z", bytes.NewReader(dataWithOffset), 0)
require.NoError(t, err)
assert.Empty(t, result)
})
t.Run("7zip at offset with wrong extension fails safely", func(t *testing.T) {
// Edge case: 7zip content at offset with non-.7z extension.
// Our check won't catch it (ByName=false, ByStream=false), but archives.FileSystem
// also won't identify it as 7zip, so it fails to extract rather than triggering OOM.
junkPrefix := []byte{0x00, 0x00, 0x00, 0x00}
sevenZipSig := []byte{0x37, 0x7a, 0xbc, 0xaf, 0x27, 0x1c, 0x00, 0x00}
dataWithOffset := append(junkPrefix, sevenZipSig...)
_, err := ae.Extract("malicious.zip", bytes.NewReader(dataWithOffset), 0)
assert.Error(t, err) // fails to extract as any valid archive format
})
}