Skip to content

Commit

Permalink
fix(file-ext): prevent users from bypassing checks on file extensions (
Browse files Browse the repository at this point in the history
…#1157)

* fix(sanitiser): remove comments from allow list

* fix(upload-utils): add detected file type to return value

* fix(mediafileservice): construct file + ext from be

* test(upload/media): add specs to ensure stuff is always sanitised

* test(markdown): update spec for empty string

* build(package): install dompurify

* refactor(utils): instantiate separate dompurify
  • Loading branch information
seaerchin authored Feb 22, 2024
1 parent e911e2e commit 5c56c74
Show file tree
Hide file tree
Showing 8 changed files with 167 additions and 42 deletions.
21 changes: 18 additions & 3 deletions package-lock.json

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

2 changes: 2 additions & 0 deletions package.json
Original file line number Diff line number Diff line change
Expand Up @@ -34,6 +34,7 @@
"@octokit/rest": "^18.12.0",
"@opengovsg/formsg-sdk": "^0.11.0",
"@opengovsg/sgid-client": "^2.0.0",
"@types/dompurify": "^3.0.5",
"auto-bind": "^4.0.0",
"aws-lambda": "^1.0.7",
"aws-sdk": "^2.1428.0",
Expand All @@ -53,6 +54,7 @@
"crypto-js": "^4.2.0",
"dd-trace": "^4.7.0",
"debug": "~2.6.9",
"dompurify": "^3.0.9",
"dotenv": "^16.3.1",
"eventsource": "^2.0.2",
"exponential-backoff": "^3.1.0",
Expand Down
34 changes: 27 additions & 7 deletions src/services/fileServices/MdPageServices/MediaFileService.js
Original file line number Diff line number Diff line change
Expand Up @@ -41,18 +41,31 @@ class MediaFileService {
throw new BadRequestError("File did not pass virus scan")
}
}

// Sanitize and validate file
const sanitizedContent = await validateAndSanitizeFileUpload(content)
if (!sanitizedContent) {
const sanitisationResult = await validateAndSanitizeFileUpload(content)
if (!sanitisationResult) {
throw new MediaTypeError(`File extension is not within the approved list`)
}

const {
content: sanitizedContent,
detectedFileType: { ext },
} = sanitisationResult
// NOTE: We construct the extension based off what we detect as the file type
const constructedFileName = `${fileName
.split(".")
.slice(0, -1)
.join(".")}.${ext}`

const { sha } = await this.repoService.create(sessionData, {
content: sanitizedContent,
fileName,
fileName: constructedFileName,
directoryName,
isMedia: true,
})
return { name: fileName, content, sha }

return { name: constructedFileName, content, sha }
}

async read(sessionData, { fileName, directoryName }) {
Expand All @@ -64,18 +77,25 @@ class MediaFileService {

async update(sessionData, { fileName, directoryName, content, sha }) {
this.mediaNameChecks({ directoryName, fileName })
const sanitizedContent = await validateAndSanitizeFileUpload(content)
if (!sanitizedContent) {
const sanitisationResult = await validateAndSanitizeFileUpload(content)
if (!sanitisationResult) {
throw new MediaTypeError(`File extension is not within the approved list`)
}
const {
content: sanitizedContent,
detectedFileType: { ext },
} = sanitisationResult

// NOTE: We can trust the user input here
// as we are removing stuff from our system.
await this.repoService.delete(sessionData, {
sha,
fileName,
directoryName,
})
const { sha: newSha } = await this.repoService.create(sessionData, {
content: sanitizedContent,
fileName,
fileName: `${fileName.split(".").slice(0, -1).join(".")}.${ext}`,
directoryName,
isMedia: true,
})
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -2,20 +2,25 @@ const { config } = require("@config/config")

const { BadRequestError } = require("@errors/BadRequestError")

const {
MediaFileService,
} = require("@services/fileServices/MdPageServices/MediaFileService")

const GITHUB_ORG_NAME = config.get("github.orgName")

describe("Media File Service", () => {
const siteName = "test-site"
const accessToken = "test-token"
const imageName = "test image.png"
const imageEncodedName = encodeURIComponent(imageName)
const fileName = "test file.pdf"
const fileName = "test file.jpg"
const fileEncodedName = encodeURIComponent(fileName)
const directoryName = "images/subfolder"
const mockContent = "schema, test"
const mockSanitizedContent = "sanitized-test"
const sha = "12345"
const mockGithubSessionData = "githubData"
const mockContent =
""
const mockSanitizedContent = mockContent.split(",")[1]

const sessionData = { siteName, accessToken }

Expand All @@ -34,22 +39,16 @@ describe("Media File Service", () => {
updateRepoState: jest.fn(),
}

// NOTE: Mock just the scan function
// as we want to omit network calls.
jest.mock("@utils/file-upload-utils", () => ({
validateAndSanitizeFileUpload: jest
.fn()
.mockReturnValue(mockSanitizedContent),
ALLOWED_FILE_EXTENSIONS: ["pdf"],
...jest.requireActual("@utils/file-upload-utils"),
scanFileForVirus: jest.fn().mockReturnValue({ CleanResult: true }),
}))

const {
MediaFileService,
} = require("@services/fileServices/MdPageServices/MediaFileService")

const service = new MediaFileService({
repoService: mockRepoService,
})
const { validateAndSanitizeFileUpload } = require("@utils/file-upload-utils")

beforeEach(() => {
jest.clearAllMocks()
Expand All @@ -66,15 +65,16 @@ describe("Media File Service", () => {
).rejects.toThrowError(BadRequestError)
})

mockRepoService.create.mockResolvedValueOnce({ sha })
it("Creating pages works correctly", async () => {
await expect(
service.create(sessionData, {
fileName,
directoryName,
content: mockContent,
})
).resolves.toMatchObject({
// Arrange
mockRepoService.create.mockResolvedValueOnce({ sha })

const result = await service.create(sessionData, {
fileName,
directoryName,
content: mockContent,
})
expect(result).toMatchObject({
name: fileName,
content: mockContent,
sha,
Expand All @@ -85,7 +85,24 @@ describe("Media File Service", () => {
directoryName,
isMedia: true,
})
expect(validateAndSanitizeFileUpload).toHaveBeenCalledWith(mockContent)
})

it("should ignore the extension provided by the user", async () => {
// Arrange
mockRepoService.create.mockResolvedValueOnce({ sha })
const fileNameWithWrongExt = "wrong.html"

// Act
const result = await service.create(sessionData, {
fileName: fileNameWithWrongExt,
directoryName,
content: mockContent,
})

// Assert
// NOTE: The original extension here is not used.
// Instead, we use the inferred extension.
expect(result.name).toBe("wrong.jpg")
})
})

Expand Down Expand Up @@ -153,8 +170,8 @@ describe("Media File Service", () => {

describe("Update", () => {
const oldSha = "54321"
mockRepoService.create.mockResolvedValueOnce({ sha })
it("Updating media file content works correctly", async () => {
mockRepoService.create.mockResolvedValueOnce({ sha })
await expect(
service.update(sessionData, {
fileName,
Expand All @@ -179,7 +196,6 @@ describe("Media File Service", () => {
directoryName,
isMedia: true,
})
expect(validateAndSanitizeFileUpload).toHaveBeenCalledWith(mockContent)
})
})

Expand All @@ -197,7 +213,7 @@ describe("Media File Service", () => {
})

describe("Rename", () => {
const oldFileName = "test old file.pdf"
const oldFileName = "test old file.jpg"

it("rejects renaming to page names with special characters", async () => {
await expect(
Expand Down
2 changes: 1 addition & 1 deletion src/services/utilServices/Sanitizer.ts
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
import DOMPurify from "isomorphic-dompurify"

DOMPurify.setConfig({
ADD_TAGS: ["iframe", "#comment", "script"],
ADD_TAGS: ["iframe", "script"],
ADD_ATTR: [
"allow",
"allowfullscreen",
Expand Down
52 changes: 52 additions & 0 deletions src/utils/__tests__/file-upload-utils.spec.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,52 @@
import { validateAndSanitizeFileUpload } from "../file-upload-utils"

describe("file-upload-utils", () => {
it("should preserve the original file type for binary format files", async () => {
// Arrange
const content =
""
const expectedExtension = "png"

// Act
const result = await validateAndSanitizeFileUpload(content)

// Assert
expect(result).toBeDefined()
expect(result?.detectedFileType.ext).toBe(expectedExtension)
})

it("should sanitize svgs with alerts", async () => {
// Arrange
// NOTE: This is a svg with an `alert` in html comments
const maliciousContent = `data:application/pdf;base64,PCEtLQphbGVydChkb2N1bWVudC5kb21haW4pCi8qCi0tPgo8c3ZnIGlkPSJzdmcyIiB4bWxucz0iaHR0cDovL3d3dy53My5vcmcvMjAwMC9zdmciIHZpZXdCb3g9IjAgMCA5MDAgOTAwIiB2ZXJzaW9uPSIxLjEiPgo8L3N2Zz4KPCEtLSAqLyAKLS0+Cg==`
const expectedExtension = "svg"

// Act
const result = await validateAndSanitizeFileUpload(maliciousContent)
const sanitisedContent = Buffer.from(result?.content, "base64").toString()

// Assert
expect(result).toBeDefined()
expect(result?.detectedFileType.ext).toBe(expectedExtension)
expect(sanitisedContent).not.toContain("alert")
})

it("should sanitize svgs with scripts", async () => {
// Arrange
// NOTE: Our sanitizer for files/html allows script tag
// however, the svg sanitizer does not as it is stricter
// and to prevent xss attacks.
const maliciousContent = `data:image/png;base64,${Buffer.from(
`<svg version="1.1" viewBox="0 0 900 900" xmlns="http://www.w3.org/2000/svg" id="svg2"><script src = "evil.com"></script></svg>`
).toString("base64")}`
const expectedExtension = "svg"

// Act
const result = await validateAndSanitizeFileUpload(maliciousContent)

// Assert
expect(result).toBeDefined()
expect(result?.detectedFileType.ext).toBe(expectedExtension)
expect(result).not.toContain("script")
})
})
4 changes: 2 additions & 2 deletions src/utils/__tests__/markdown-utils.spec.ts
Original file line number Diff line number Diff line change
Expand Up @@ -103,8 +103,8 @@ describe("Sanitized markdown utils test", () => {
)
})

it("should inject a html comment tag when the string is empty", () => {
expect(sanitizer.sanitize("")).toBe(HTML_COMMENT_TAG)
it("should not perform sanitisation when the string is empty", () => {
expect(sanitizer.sanitize("")).toBe("")
})
})
})
Loading

0 comments on commit 5c56c74

Please sign in to comment.