|
| 1 | +import { describe, expect, it } from "vitest"; |
| 2 | +import { stripFilenameControlChars } from "./outbound-filename.js"; |
| 3 | + |
| 4 | +const c = (code: number): string => String.fromCharCode(code); |
| 5 | + |
| 6 | +describe("stripFilenameControlChars", () => { |
| 7 | + it("returns plain ASCII filenames unchanged", () => { |
| 8 | + expect(stripFilenameControlChars("report.pdf")).toBe("report.pdf"); |
| 9 | + expect(stripFilenameControlChars("a.b-c_d.tar.gz")).toBe("a.b-c_d.tar.gz"); |
| 10 | + }); |
| 11 | + |
| 12 | + it("preserves non-ASCII letters and digits", () => { |
| 13 | + expect(stripFilenameControlChars("日本語_2025.pdf")).toBe("日本語_2025.pdf"); |
| 14 | + expect(stripFilenameControlChars("отчет.docx")).toBe("отчет.docx"); |
| 15 | + expect(stripFilenameControlChars("ملف.pdf")).toBe("ملف.pdf"); |
| 16 | + }); |
| 17 | + |
| 18 | + it.each([ |
| 19 | + { name: "C0 control NUL", code: 0x0000 }, |
| 20 | + { name: "C0 control TAB", code: 0x0009 }, |
| 21 | + { name: "C0 control LF", code: 0x000a }, |
| 22 | + { name: "C0 control CR", code: 0x000d }, |
| 23 | + { name: "C0 control US", code: 0x001f }, |
| 24 | + { name: "DEL", code: 0x007f }, |
| 25 | + { name: "C1 control PAD", code: 0x0080 }, |
| 26 | + { name: "C1 control APC", code: 0x009f }, |
| 27 | + { name: "ZWSP", code: 0x200b }, |
| 28 | + { name: "ZWNJ", code: 0x200c }, |
| 29 | + { name: "ZWJ", code: 0x200d }, |
| 30 | + { name: "LRE", code: 0x202a }, |
| 31 | + { name: "RLE", code: 0x202b }, |
| 32 | + { name: "PDF", code: 0x202c }, |
| 33 | + { name: "LRO", code: 0x202d }, |
| 34 | + { name: "RLO", code: 0x202e }, |
| 35 | + { name: "LRI", code: 0x2066 }, |
| 36 | + { name: "RLI", code: 0x2067 }, |
| 37 | + { name: "FSI", code: 0x2068 }, |
| 38 | + { name: "PDI", code: 0x2069 }, |
| 39 | + { name: "BOM / ZWNBSP", code: 0xfeff }, |
| 40 | + ] as const)("strips $name", ({ code }) => { |
| 41 | + const input = `pre${c(code)}post.txt`; |
| 42 | + expect(stripFilenameControlChars(input)).toBe("prepost.txt"); |
| 43 | + }); |
| 44 | + |
| 45 | + it("collapses bidi-spoofed extensions to their visible byte order", () => { |
| 46 | + // "report" + RLO + "gpj.exe" displays as "reportexe.jpg" on bidi-aware |
| 47 | + // clients but the underlying bytes end in .exe. After stripping RLO the |
| 48 | + // visible name matches the bytes. |
| 49 | + const input = `report${c(0x202e)}gpj.exe`; |
| 50 | + expect(stripFilenameControlChars(input)).toBe("reportgpj.exe"); |
| 51 | + }); |
| 52 | + |
| 53 | + it("returns an empty string when every character is stripped", () => { |
| 54 | + const allControl = `${c(0x0000)}${c(0x202e)}${c(0xfeff)}${c(0x200b)}`; |
| 55 | + expect(stripFilenameControlChars(allControl)).toBe(""); |
| 56 | + }); |
| 57 | + |
| 58 | + it("returns an empty string for empty input", () => { |
| 59 | + expect(stripFilenameControlChars("")).toBe(""); |
| 60 | + }); |
| 61 | + |
| 62 | + it("leaves printable Unicode outside the strip ranges intact", () => { |
| 63 | + // U+200E (LRM), U+200F (RLM), and U+202F (NARROW NO-BREAK SPACE) sit |
| 64 | + // just outside the strip ranges; preserve them so this helper does not |
| 65 | + // silently drift into broader filename normalization. |
| 66 | + const input = `a${c(0x200e)}b${c(0x200f)}c${c(0x202f)}d`; |
| 67 | + expect(stripFilenameControlChars(input)).toBe(input); |
| 68 | + }); |
| 69 | +}); |
0 commit comments