From 22175dc6648985c8b7f54a3f0b3c3e6e3a66684e Mon Sep 17 00:00:00 2001 From: Fityan Date: Tue, 14 Nov 2023 10:01:55 +0700 Subject: [PATCH 1/4] feat: add support for custom charSets and multiple charSets --- src/index.ts | 48 ++++++++++++++++++++---- test/index.spec.ts | 91 +++++++++++++++++++++++++++++++++++++++++++--- 2 files changed, 127 insertions(+), 12 deletions(-) diff --git a/src/index.ts b/src/index.ts index 59eb8c0..f9bd010 100644 --- a/src/index.ts +++ b/src/index.ts @@ -2,12 +2,21 @@ import fs from 'node:fs'; import path from 'node:path'; import { fileURLToPath } from 'node:url'; -export type CharSetNames = 'latin' | 'latin-1'; +export const CharSets = { + LATIN: 'latin', + LATIN_1: 'latin-1', +} as const; +export type CharSetNames = typeof CharSets[keyof typeof CharSets]; export type CharSet = Record; const dirname = path.dirname(fileURLToPath(import.meta.url)); function getCharSet(name: CharSetNames = 'latin'): CharSet { + // Validating the name + if (!Object.values(CharSets).includes(name)) { + throw new Error(`Invalid charSet name: ${name}`); + } + const strJson = fs.readFileSync( path.resolve(dirname, `../charsets/${name}.json`), { encoding: 'utf8' }, @@ -15,12 +24,37 @@ function getCharSet(name: CharSetNames = 'latin'): CharSet { return JSON.parse(strJson) as CharSet; } -function getChar(char: string, charSet: CharSet, caseSensitive?: boolean) { - const upperReplacements = charSet[char.toUpperCase()] ?? []; - const lowerReplacements = charSet[char.toLowerCase()] ?? []; +export function mergeCharSets(...charSets: (CharSetNames | CharSet)[]): CharSet { + const res: CharSet = {}; + + for (const charSet of charSets) { + const charSetObj = typeof charSet === 'string' ? getCharSet(charSet) : charSet; + // Validate the charSet + if ( + Object.keys(charSetObj).some((char) => char.length !== 1) + || Object.values(charSetObj).some((replacements) => replacements?.some((replacement) => replacement.length !== 1)) + ) { + throw new Error('Invalid charSet: each key and value must be a single character'); + } + + for (const [char, replacements] of Object.entries(charSetObj)) { + res[char] = Array.from(new Set([ + ...(res[char] ?? []), + ...(replacements ?? []), + ])); + } + } + + return res; +} + +function getChar(char: string, charSet: CharSet, caseSensitive?: boolean) { const replacements = caseSensitive ? charSet[char] ?? [] - : Array.from(new Set([...upperReplacements, ...lowerReplacements])); + : Array.from(new Set([ + ...(charSet[char.toUpperCase()] ?? []), + ...(charSet[char.toLowerCase()] ?? []), + ])); if (!replacements.length) { return char; @@ -33,11 +67,11 @@ export type Options = { text: string; phrases?: string[]; caseSensitive?: boolean; - charSet?: CharSetNames; + charSets?: (CharSetNames | CharSet)[]; }; export default function wisely(options: Options): string { - const charSet = getCharSet(options.charSet); + const charSet = mergeCharSets(...(options.charSets ?? ['latin'])); const censor = (phrase: string): string => phrase.split('') .map((char) => getChar(char, charSet, options.caseSensitive)) diff --git a/test/index.spec.ts b/test/index.spec.ts index e8bf514..ecea049 100644 --- a/test/index.spec.ts +++ b/test/index.spec.ts @@ -1,5 +1,6 @@ +/* eslint-disable @typescript-eslint/ban-ts-comment */ import { describe, expect, test } from 'vitest'; -import wisely from '~/index.js'; +import wisely, { Options, mergeCharSets } from '~/index.js'; describe('wisely', () => { const text = 'Palestine will be free! Freedom is the right of ALL nations!'; @@ -55,10 +56,29 @@ describe('wisely', () => { expect(wisely({ text, phrases: [] })).toEqual(text); }); - test.each([ - { testText: 'AaBbCcDdXxZz', contains: '\u00df\u00d7Zz', notContains: 'AaBbCcDdXx' }, - ])('with specific charSet (latin-1): $testText', ({ testText, contains, notContains }) => { - const result = wisely({ text: testText, charSet: 'latin-1' }); + test.each<{ testText: string, charSets: Options['charSets'], contains: string, notContains: string }>([ + { + charSets: ['latin-1'], + testText: 'AaBbCcDdXxZz', + contains: '\u00df\u00d7Zz', + notContains: 'AaBbCcDdXx', + }, + { + charSets: ['latin', 'latin-1'], + testText: 'AaBbCcDdXxZz', + contains: '\u00d72', + notContains: 'AaBbCcDdXxZz', + }, + { + charSets: [{ a: ['b', 'c'], x: ['y', 'z'] }], + testText: 'AaBbCcDdXxZz', + contains: 'BbCcDdZz', + notContains: 'AaXx', + }, + ])('with specific charSet $charSets: $testText', ({ + testText, charSets, contains, notContains, + }) => { + const result = wisely({ text: testText, charSets }); contains.split('').forEach((char) => { expect(result).contain(char); @@ -71,3 +91,64 @@ describe('wisely', () => { expect(result).toHaveLength(testText.length); }); }); + +describe('mergeCharSets', () => { + test('merge two charSets', () => { + const charSet1 = { a: ['b', 'c'], x: ['y', 'z'] }; + const charSet2 = { a: ['c', 'd', 'e'], X: ['Y', 'Z'] }; + + expect(mergeCharSets(charSet1, charSet2)).toEqual({ + a: ['b', 'c', 'd', 'e'], + x: ['y', 'z'], + X: ['Y', 'Z'], + }); + }); + + test('merge three charSets', () => { + const charSet1 = { a: ['b', 'c'], x: ['y', 'z'] }; + const charSet2 = { a: ['c', 'd', 'e'], X: ['Y', 'Z'] }; + const charSet3 = { a: ['e', 'f', 'g'], A: ['B', 'C'] }; + + expect(mergeCharSets(charSet1, charSet2, charSet3)).toEqual({ + a: ['b', 'c', 'd', 'e', 'f', 'g'], + A: ['B', 'C'], + x: ['y', 'z'], + X: ['Y', 'Z'], + }); + }); + + test('merge charSet with charSetNames', () => { + const charSet1 = { a: ['b', 'c'], x: ['y', 'z'] }; + + expect(mergeCharSets(charSet1, 'latin')).toEqual( + expect.objectContaining({ + A: ['4'], + a: ['b', 'c', '@'], + x: ['y', 'z'], + Z: ['2'], + }), + ); + }); + + test('duplicate charSetNames', () => { + expect(mergeCharSets('latin', 'latin')).toEqual( + expect.objectContaining({ + A: ['4'], a: ['@'], B: ['8'], b: ['6'], Z: ['2'], + }), + ); + }); + + test('Unknown charSetNames', () => { + // @ts-expect-error + expect(() => mergeCharSets('')).toThrow(); + // @ts-expect-error + expect(() => mergeCharSets('x')).toThrow(); + }); + + test('Invalid custom charSet', () => { + expect(() => mergeCharSets({ aa: ['b', 'c', 'd'] })).toThrow(); + expect(() => mergeCharSets({ a: ['bc'] })).toThrow(); + expect(() => mergeCharSets({ a: ['b', 'c', ''] })).toThrow(); + expect(() => mergeCharSets({ a: ['b', 'c', 'd', ''] })).toThrow(); + }); +}); From feaff05f72eea4c544d97845b380c254f5c09cd7 Mon Sep 17 00:00:00 2001 From: Fityan Date: Tue, 14 Nov 2023 10:57:40 +0700 Subject: [PATCH 2/4] sort the replacement chars, update the docs, update tests --- README.md | 50 ++++++++++----- charsets/latin-1.json | 2 +- src/index.ts | 3 +- test/index.spec.ts | 140 ++++++++++++++++++++++++------------------ 4 files changed, 117 insertions(+), 78 deletions(-) diff --git a/README.md b/README.md index d15fd65..cf125dd 100644 --- a/README.md +++ b/README.md @@ -36,7 +36,7 @@ console.log(res1, res2); ## API -### wisely(options) +### `wisely(options)` Returns a `string` with the obsfucated text. @@ -46,41 +46,61 @@ Type: `object` ##### text -Type: `string` -Required: `true` +- Type: `string` +- Required: `true` The text to be obscured. ##### phrases -Type: `string[]` \ -Required: `false` +- Type: `string[]` +- Required: `false` The specific phrases to be obscured. If not specified, the whole text will be obscured. ##### caseSensitive -Type: `boolean` \ -Default: `false` +- Type: `boolean` +- Default: `false` Whether to obscure in a case-sensitive manner. -##### charSet +##### charSets -Type: `string` \ -Default: `'latin'` \ -Values: `'latin'` | `'latin-1'` +- Type: `(string | object)[]` +- Default: `['latin']` -The character set that will be used for obfuscation. +The character set that will be used for obfuscation. Put the **name of the** [**built-in character sets**](#character-sets) or a **custom character set objects**. -> In the future, we will add support for more character sets to improve the variety of the obsfucated text. Also, we will add support to define custom character sets. +The custom character set object must be an object that **each key is a single character** and **each value is an array of single characters** that will be used to replace the key. See the example below. + +```js +const customCharSet = { + a: ['@', '4'], + e: ['3'], + i: ['1', '!'], + o: ['0'], + s: ['5', '$'], + t: ['7'], +}; +``` + +### `mergeCharSets(...charSets)` + +Returns a merged character set object. + +#### charSets + +Type: `string | object` + +The character set that will be merged. Put the **name of the** [**built-in character sets**](#character-sets) or a **custom character set objects**. ## Character Sets Below is the built-in character sets available. See the details of each character set in the [charsets](./charsets) directory. -| `charSet` | Block Name | Block Range | -| ---- | --------- | ----- | +| `charSet` Name | Block Name | Block Range | +| --- | --- | --- | | `latin` | [Basic Latin](https://unicodeplus.com/block/0000) | \u0000 - \u007f | | `latin-1` | [Latin-1 Supplement](https://unicodeplus.com/block/0080) | \u0080 - \u00ff | diff --git a/charsets/latin-1.json b/charsets/latin-1.json index 1014c83..38a6082 100644 --- a/charsets/latin-1.json +++ b/charsets/latin-1.json @@ -1,6 +1,6 @@ { "A": ["\u00c0", "\u00c1", "\u00c2", "\u00c3", "\u00c4", "\u00c5"], - "a": ["\u00e0", "\u00e1", "\u00e2", "\u00e3", "\u00e4", "\u00e5", "\u00aa"], + "a": ["\u00aa", "\u00e0", "\u00e1", "\u00e2", "\u00e3", "\u00e4", "\u00e5"], "B": ["\u00df"], "C": ["\u00a2", "\u00a9", "\u00c7"], "c": ["\u00e7"], diff --git a/src/index.ts b/src/index.ts index f9bd010..93662ab 100644 --- a/src/index.ts +++ b/src/index.ts @@ -21,6 +21,7 @@ function getCharSet(name: CharSetNames = 'latin'): CharSet { path.resolve(dirname, `../charsets/${name}.json`), { encoding: 'utf8' }, ); + return JSON.parse(strJson) as CharSet; } @@ -42,7 +43,7 @@ export function mergeCharSets(...charSets: (CharSetNames | CharSet)[]): CharSet res[char] = Array.from(new Set([ ...(res[char] ?? []), ...(replacements ?? []), - ])); + ])).sort(); } } diff --git a/test/index.spec.ts b/test/index.spec.ts index ecea049..0183989 100644 --- a/test/index.spec.ts +++ b/test/index.spec.ts @@ -2,6 +2,85 @@ import { describe, expect, test } from 'vitest'; import wisely, { Options, mergeCharSets } from '~/index.js'; +describe('mergeCharSets', () => { + test('merge two built-in charSets', () => { + const mergedCharSet = mergeCharSets('latin', 'latin-1'); + + expect(mergedCharSet).toEqual( + expect.objectContaining({ + A: ['4', '\u00c0', '\u00c1', '\u00c2', '\u00c3', '\u00c4', '\u00c5'], + a: ['@', '\u00aa', '\u00e0', '\u00e1', '\u00e2', '\u00e3', '\u00e4', '\u00e5'], + }), + ); + }); + + test('merge built-in charSets with custom charSets', () => { + const customCharSet = { a: ['b', 'c'], x: ['y', 'z'] }; + + expect(mergeCharSets('latin', customCharSet)).toEqual( + expect.objectContaining({ + A: ['4'], + a: ['@', 'b', 'c'], + x: ['y', 'z'], + Z: ['2'], + }), + ); + }); + + test('merge two custom charSets', () => { + const charSet1 = { a: ['b', 'c'], x: ['y', 'z'] }; + const charSet2 = { a: ['c', 'd', 'e'], X: ['Y', 'Z'] }; + + expect(mergeCharSets(charSet1, charSet2)).toEqual({ + a: ['b', 'c', 'd', 'e'], + x: ['y', 'z'], + X: ['Y', 'Z'], + }); + }); + + test('charSet order should not affect the result', () => { + const customCharSet = { a: ['4', '@'] }; + + expect(mergeCharSets('latin', 'latin-1')).toEqual(mergeCharSets('latin-1', 'latin')); + expect(mergeCharSets('latin', customCharSet)).toEqual(mergeCharSets(customCharSet, 'latin')); + }); + + test('merge three custom charSets', () => { + const charSet1 = { a: ['b', 'c'], x: ['y', 'z'] }; + const charSet2 = { a: ['c', 'd', 'e'], X: ['Y', 'Z'] }; + const charSet3 = { a: ['e', 'f', 'g'], A: ['B', 'C'] }; + + expect(mergeCharSets(charSet1, charSet2, charSet3)).toEqual({ + a: ['b', 'c', 'd', 'e', 'f', 'g'], + A: ['B', 'C'], + x: ['y', 'z'], + X: ['Y', 'Z'], + }); + }); + + test('duplicate built-in charSets names', () => { + expect(mergeCharSets('latin', 'latin')).toEqual( + expect.objectContaining({ + A: ['4'], a: ['@'], B: ['8'], b: ['6'], Z: ['2'], + }), + ); + }); + + test('unknown charSets names', () => { + // @ts-expect-error + expect(() => mergeCharSets('')).toThrow(); + // @ts-expect-error + expect(() => mergeCharSets('x')).toThrow(); + }); + + test('invalid custom charSets', () => { + expect(() => mergeCharSets({ aa: ['b', 'c', 'd'] })).toThrow(); + expect(() => mergeCharSets({ a: ['bc'] })).toThrow(); + expect(() => mergeCharSets({ a: ['b', 'c', ''] })).toThrow(); + expect(() => mergeCharSets({ a: ['b', 'c', 'd', ''] })).toThrow(); + }); +}); + describe('wisely', () => { const text = 'Palestine will be free! Freedom is the right of ALL nations!'; @@ -91,64 +170,3 @@ describe('wisely', () => { expect(result).toHaveLength(testText.length); }); }); - -describe('mergeCharSets', () => { - test('merge two charSets', () => { - const charSet1 = { a: ['b', 'c'], x: ['y', 'z'] }; - const charSet2 = { a: ['c', 'd', 'e'], X: ['Y', 'Z'] }; - - expect(mergeCharSets(charSet1, charSet2)).toEqual({ - a: ['b', 'c', 'd', 'e'], - x: ['y', 'z'], - X: ['Y', 'Z'], - }); - }); - - test('merge three charSets', () => { - const charSet1 = { a: ['b', 'c'], x: ['y', 'z'] }; - const charSet2 = { a: ['c', 'd', 'e'], X: ['Y', 'Z'] }; - const charSet3 = { a: ['e', 'f', 'g'], A: ['B', 'C'] }; - - expect(mergeCharSets(charSet1, charSet2, charSet3)).toEqual({ - a: ['b', 'c', 'd', 'e', 'f', 'g'], - A: ['B', 'C'], - x: ['y', 'z'], - X: ['Y', 'Z'], - }); - }); - - test('merge charSet with charSetNames', () => { - const charSet1 = { a: ['b', 'c'], x: ['y', 'z'] }; - - expect(mergeCharSets(charSet1, 'latin')).toEqual( - expect.objectContaining({ - A: ['4'], - a: ['b', 'c', '@'], - x: ['y', 'z'], - Z: ['2'], - }), - ); - }); - - test('duplicate charSetNames', () => { - expect(mergeCharSets('latin', 'latin')).toEqual( - expect.objectContaining({ - A: ['4'], a: ['@'], B: ['8'], b: ['6'], Z: ['2'], - }), - ); - }); - - test('Unknown charSetNames', () => { - // @ts-expect-error - expect(() => mergeCharSets('')).toThrow(); - // @ts-expect-error - expect(() => mergeCharSets('x')).toThrow(); - }); - - test('Invalid custom charSet', () => { - expect(() => mergeCharSets({ aa: ['b', 'c', 'd'] })).toThrow(); - expect(() => mergeCharSets({ a: ['bc'] })).toThrow(); - expect(() => mergeCharSets({ a: ['b', 'c', ''] })).toThrow(); - expect(() => mergeCharSets({ a: ['b', 'c', 'd', ''] })).toThrow(); - }); -}); From 9844fbee1fad0dfa3bd27ff82e872a6a21c55f6a Mon Sep 17 00:00:00 2001 From: Fityan Date: Tue, 14 Nov 2023 11:20:27 +0700 Subject: [PATCH 3/4] refactor: add `isCharSetValid()` and test the charsets data --- src/index.ts | 10 ++++++---- test/charsets.spec.ts | 17 +++++++++++++++++ 2 files changed, 23 insertions(+), 4 deletions(-) create mode 100644 test/charsets.spec.ts diff --git a/src/index.ts b/src/index.ts index 93662ab..9df8dde 100644 --- a/src/index.ts +++ b/src/index.ts @@ -25,6 +25,11 @@ function getCharSet(name: CharSetNames = 'latin'): CharSet { return JSON.parse(strJson) as CharSet; } +export function isCharSetValid(charSet: CharSet): boolean { + return !Object.keys(charSet).some((char) => char.length !== 1) + && !Object.values(charSet).some((replacements) => replacements?.some((replacement) => replacement.length !== 1)); +} + export function mergeCharSets(...charSets: (CharSetNames | CharSet)[]): CharSet { const res: CharSet = {}; @@ -32,10 +37,7 @@ export function mergeCharSets(...charSets: (CharSetNames | CharSet)[]): CharSet const charSetObj = typeof charSet === 'string' ? getCharSet(charSet) : charSet; // Validate the charSet - if ( - Object.keys(charSetObj).some((char) => char.length !== 1) - || Object.values(charSetObj).some((replacements) => replacements?.some((replacement) => replacement.length !== 1)) - ) { + if (!isCharSetValid(charSetObj)) { throw new Error('Invalid charSet: each key and value must be a single character'); } diff --git a/test/charsets.spec.ts b/test/charsets.spec.ts new file mode 100644 index 0000000..2abe1ce --- /dev/null +++ b/test/charsets.spec.ts @@ -0,0 +1,17 @@ +import fs from 'node:fs'; +import path from 'node:path'; +import { expect, test } from 'vitest'; +import { CharSet, isCharSetValid } from '~/index.js'; + +test.each([ + { name: 'latin' }, + { name: 'latin-1' }, +])('validate charSet: $name', ({ name }) => { + const strJson = fs.readFileSync( + path.resolve(__dirname, `../charsets/${name}.json`), + { encoding: 'utf8' }, + ); + + const charSet = JSON.parse(strJson) as CharSet; + expect(isCharSetValid(charSet)).toBe(true); +}); From 6f663c05aac386f7171686e69176e7a4dc3b496c Mon Sep 17 00:00:00 2001 From: Fityan Date: Tue, 14 Nov 2023 11:37:51 +0700 Subject: [PATCH 4/4] refactor: improve `isCharSetValid()` logic --- README.md | 12 +++++++++++- src/index.ts | 14 +++++++++----- 2 files changed, 20 insertions(+), 6 deletions(-) diff --git a/README.md b/README.md index cf125dd..41656a0 100644 --- a/README.md +++ b/README.md @@ -72,7 +72,7 @@ Whether to obscure in a case-sensitive manner. The character set that will be used for obfuscation. Put the **name of the** [**built-in character sets**](#character-sets) or a **custom character set objects**. -The custom character set object must be an object that **each key is a single character** and **each value is an array of single characters** that will be used to replace the key. See the example below. +The valid custom character set object must be an object that **each key is a single character** and **each value is an array of single characters** that will be used to replace the key. See the example below. ```js const customCharSet = { @@ -85,6 +85,16 @@ const customCharSet = { }; ``` +### `isCharSetValid(charSet)` + +Returns a `boolean` whether the character set is valid. + +#### charSet + +Type: `object` + +The character set that will be checked. + ### `mergeCharSets(...charSets)` Returns a merged character set object. diff --git a/src/index.ts b/src/index.ts index 9df8dde..e26dfe7 100644 --- a/src/index.ts +++ b/src/index.ts @@ -26,8 +26,12 @@ function getCharSet(name: CharSetNames = 'latin'): CharSet { } export function isCharSetValid(charSet: CharSet): boolean { - return !Object.keys(charSet).some((char) => char.length !== 1) - && !Object.values(charSet).some((replacements) => replacements?.some((replacement) => replacement.length !== 1)); + return typeof charSet === 'object' + && Object.keys(charSet).every((key) => key.length === 1) + && Object.values(charSet).every((replacements) => ( + Array.isArray(replacements) + && replacements.every((char) => char.length === 1) + )); } export function mergeCharSets(...charSets: (CharSetNames | CharSet)[]): CharSet { @@ -41,9 +45,9 @@ export function mergeCharSets(...charSets: (CharSetNames | CharSet)[]): CharSet throw new Error('Invalid charSet: each key and value must be a single character'); } - for (const [char, replacements] of Object.entries(charSetObj)) { - res[char] = Array.from(new Set([ - ...(res[char] ?? []), + for (const [key, replacements] of Object.entries(charSetObj)) { + res[key] = Array.from(new Set([ + ...(res[key] ?? []), ...(replacements ?? []), ])).sort(); }