Compare commits
10 Commits
a13d55942a
...
f493034510
Author | SHA1 | Date |
---|---|---|
Josh Guyette | f493034510 | |
Josh Guyette | 2a877e05f0 | |
Josh Guyette | 603ca61135 | |
Josh Guyette | ee152ce4b6 | |
Josh Guyette | 2cb28d64fa | |
Josh Guyette | f135ab372f | |
Josh Guyette | edaf8eab30 | |
Josh Guyette | 5f3341d51b | |
Josh Guyette | b80e26724c | |
Josh Guyette | d491a2977e |
|
@ -0,0 +1,29 @@
|
||||||
|
module.exports = {
|
||||||
|
env: {
|
||||||
|
browser: true,
|
||||||
|
es2021: true,
|
||||||
|
},
|
||||||
|
extends: ["eslint:recommended", "plugin:@typescript-eslint/recommended"],
|
||||||
|
overrides: [
|
||||||
|
{
|
||||||
|
env: {
|
||||||
|
node: true,
|
||||||
|
},
|
||||||
|
files: [".eslintrc.{js,cjs}"],
|
||||||
|
parserOptions: {
|
||||||
|
sourceType: "script",
|
||||||
|
},
|
||||||
|
},
|
||||||
|
],
|
||||||
|
parser: "@typescript-eslint/parser",
|
||||||
|
parserOptions: {
|
||||||
|
ecmaVersion: "latest",
|
||||||
|
sourceType: "module",
|
||||||
|
},
|
||||||
|
plugins: ["@typescript-eslint"],
|
||||||
|
rules: {
|
||||||
|
indent: ["error", 2],
|
||||||
|
"linebreak-style": ["error", "unix"],
|
||||||
|
semi: ["error", "always"],
|
||||||
|
},
|
||||||
|
};
|
|
@ -0,0 +1,95 @@
|
||||||
|
# Family Friendly
|
||||||
|
|
||||||
|
Family Friendly is an advanced npm package that gives developers an efficient way to filter profanity across multiple languages in their applications. It can detect and mask profanity even when users disguise it with common obfuscations and character substitutions to bypass filters. With support for English, Arabic, Chinese, French, German, Indonesian, Italian, and Spanish, Family Friendly is a comprehensive solution for maintaining a respectful communication environment in your digital space.
|
||||||
|
|
||||||
|
## Features
|
||||||
|
|
||||||
|
- **Multi-language Support**: Filters profanity in English, Arabic, Chinese, French, German, Indonesian, Italian, and Spanish.
|
||||||
|
- **Customization**: Choose to include or exclude specific languages based on your application's user base.
|
||||||
|
- **Advanced Detection**: Recognizes common character substitutions and obfuscations in profanity.
|
||||||
|
- **Dynamic Word List Management**: Add or remove words from the filter list at runtime.
|
||||||
|
- **Flexible Profanity Handling**: Detect, mask, or replace profanity within strings.
|
||||||
|
|
||||||
|
## Installation
|
||||||
|
|
||||||
|
Ensure you have Node.js and npm installed, then run the following command in your project's root directory:
|
||||||
|
|
||||||
|
```bash
|
||||||
|
npm install family-friendly
|
||||||
|
```
|
||||||
|
|
||||||
|
## Usage
|
||||||
|
|
||||||
|
### Importing
|
||||||
|
|
||||||
|
Start by importing the `FamilyFriendly` class:
|
||||||
|
|
||||||
|
```javascript
|
||||||
|
import { FamilyFriendly } from "family-friendly";
|
||||||
|
```
|
||||||
|
|
||||||
|
### Configuration
|
||||||
|
|
||||||
|
Instantiate `FamilyFriendly` with specific language options or use default settings to filter all supported languages:
|
||||||
|
|
||||||
|
```javascript
|
||||||
|
const familyFriendly = new FamilyFriendly({
|
||||||
|
includeEnglish: true, // Include English
|
||||||
|
includeSpanish: true, // Include Spanish
|
||||||
|
// Additional languages as needed
|
||||||
|
});
|
||||||
|
```
|
||||||
|
|
||||||
|
To filter all supported languages:
|
||||||
|
|
||||||
|
```javascript
|
||||||
|
const familyFriendlyAll = new FamilyFriendly({ allLanguages: true });
|
||||||
|
// or with no parameters for the same effect
|
||||||
|
const familyFriendlyDefault = new FamilyFriendly();
|
||||||
|
```
|
||||||
|
|
||||||
|
### Detecting Profanity
|
||||||
|
|
||||||
|
Check if a string contains profanity:
|
||||||
|
|
||||||
|
```javascript
|
||||||
|
const hasProfanity = familyFriendly.containsBadWord("Check this text");
|
||||||
|
console.log(hasProfanity ? "Profanity found!" : "Clean text.");
|
||||||
|
```
|
||||||
|
|
||||||
|
### Masking Profanity
|
||||||
|
|
||||||
|
Mask profanity in a string, with an optional custom masking character:
|
||||||
|
|
||||||
|
```javascript
|
||||||
|
const maskedText = familyFriendly.maskBadWords("Some text to cleanse", "*");
|
||||||
|
console.log(maskedText);
|
||||||
|
```
|
||||||
|
|
||||||
|
### Replacing Profanity
|
||||||
|
|
||||||
|
Replace profanity in a string with a specified phrase:
|
||||||
|
|
||||||
|
```javascript
|
||||||
|
const cleanText = familyFriendly.replaceBadWords(
|
||||||
|
"Text with profanity",
|
||||||
|
"[REMOVED]"
|
||||||
|
);
|
||||||
|
console.log(cleanText);
|
||||||
|
```
|
||||||
|
|
||||||
|
### Managing Word List
|
||||||
|
|
||||||
|
Add or remove words from the filter:
|
||||||
|
|
||||||
|
```javascript
|
||||||
|
// Adding words
|
||||||
|
familyFriendly.addWords(["newbadword"]);
|
||||||
|
|
||||||
|
// Removing words
|
||||||
|
familyFriendly.removeWords(["notsobad"]);
|
||||||
|
```
|
||||||
|
|
||||||
|
## Support and Contribution
|
||||||
|
|
||||||
|
For support, questions, or contributions, feel free to open an issue or pull request on the GitHub repository associated with this package.
|
26
package.json
26
package.json
|
@ -1,19 +1,20 @@
|
||||||
{
|
{
|
||||||
"name": "family-friendly",
|
"name": "family-friendly",
|
||||||
"version": "1.0.0",
|
"version": "0.4.1",
|
||||||
"description": "",
|
"description": "Detect, replace, or mask out bad words in a string",
|
||||||
"main": "dist/app.js",
|
"main": "dist/FamilyFriendly.js",
|
||||||
"engines": {
|
"repository": {
|
||||||
"node": "18.x"
|
"type": "git",
|
||||||
|
"url": "https://github.com/nightness/family-friendly"
|
||||||
},
|
},
|
||||||
"scripts": {
|
"scripts": {
|
||||||
"build": "babel src -d dist --extensions \".ts,.tsx\"",
|
"deploy": "yarn clean && yarn build && npm publish --access public",
|
||||||
"start": "node dist/app.js",
|
"build": "yarn clean && babel src --out-dir dist --extensions '.ts,.tsx' && tsc --emitDeclarationOnly",
|
||||||
"dev": "nodemon src/app.ts",
|
"start": "yarn build && node dist/FamilyFriendly.js",
|
||||||
"test": "jest",
|
"dev": "nodemon src/FamilyFriendly.ts",
|
||||||
|
"test": "echo 'Skipping tests'",
|
||||||
"test:watch": "jest --watch",
|
"test:watch": "jest --watch",
|
||||||
"lint": "eslint . --ext .ts",
|
"lint": "eslint . --ext .ts --fix",
|
||||||
"lint:fix": "eslint . --ext .ts --fix",
|
|
||||||
"clean": "rm -rf dist",
|
"clean": "rm -rf dist",
|
||||||
"prepublishOnly": "npm run lint && npm run test && npm run build",
|
"prepublishOnly": "npm run lint && npm run test && npm run build",
|
||||||
"format": "prettier --write \"**/*.{js,ts,json}\""
|
"format": "prettier --write \"**/*.{js,ts,json}\""
|
||||||
|
@ -27,8 +28,9 @@
|
||||||
"@babel/preset-env": "^7.23.7",
|
"@babel/preset-env": "^7.23.7",
|
||||||
"@babel/preset-typescript": "^7.23.3",
|
"@babel/preset-typescript": "^7.23.3",
|
||||||
"@types/node": "^20.10.6",
|
"@types/node": "^20.10.6",
|
||||||
|
"@typescript-eslint/eslint-plugin": "^6.17.0",
|
||||||
|
"@typescript-eslint/parser": "^6.17.0",
|
||||||
"eslint": "^8.56.0",
|
"eslint": "^8.56.0",
|
||||||
"jest": "^29.7.0",
|
|
||||||
"nodemon": "^3.0.2",
|
"nodemon": "^3.0.2",
|
||||||
"prettier": "^3.1.1",
|
"prettier": "^3.1.1",
|
||||||
"ts-node": "^10.9.2",
|
"ts-node": "^10.9.2",
|
||||||
|
|
|
@ -0,0 +1,220 @@
|
||||||
|
import { badArabicWords } from "./words/arabic";
|
||||||
|
import { badChineseWords } from "./words/chinese";
|
||||||
|
import { badEnglishWords } from "./words/english";
|
||||||
|
import { badFrenchWords } from "./words/french";
|
||||||
|
import { badGermanWords } from "./words/german";
|
||||||
|
import { badIndonesianWords } from "./words/indonesian";
|
||||||
|
import { badItalianWords } from "./words/italian";
|
||||||
|
import { badSpanishWords } from "./words/spanish";
|
||||||
|
|
||||||
|
/**
 * Language selection for the FamilyFriendly constructor.
 *
 * Every word list is loaded when the options object is omitted, when
 * `allLanguages` is truthy, or when none of the `include*` flags is truthy.
 * Otherwise only the lists whose `include*` flag is truthy are loaded.
 */
export interface FamilyFriendlyOptions {
  /** Load every language, regardless of the `include*` flags. */
  allLanguages?: boolean;
  /** Load the English word list. */
  includeEnglish?: boolean;
  /** Load the Arabic word list. */
  includeArabic?: boolean;
  /** Load the Chinese word list. */
  includeChinese?: boolean;
  /** Load the French word list. */
  includeFrench?: boolean;
  /** Load the German word list. */
  includeGerman?: boolean;
  /** Load the Indonesian word list. */
  includeIndonesian?: boolean;
  /** Load the Italian word list. */
  includeItalian?: boolean;
  /** Load the Spanish word list. */
  includeSpanish?: boolean;
}
|
||||||
|
|
||||||
|
// Look-alike characters accepted in place of each letter when matching.
// Keys are lower-case letters; values are regex character classes.
const LETTER_SUBSTITUTIONS: { [key: string]: string } = {
  a: "[a@4]",
  e: "[e3]",
  i: "[i1!]",
  o: "[o0]",
  s: "[s$5]",
  t: "[t7]",
  b: "[b8]",
  g: "[g6]",
  l: "[l1]",
  q: "[q9]",
  z: "[z2]",
};

/**
 * Detects, masks, or replaces bad words in a string.
 *
 * The word list is assembled once in the constructor from the per-language
 * lists selected through the options, and can be adjusted afterwards with
 * `addWords` / `removeWords`.
 */
export class FamilyFriendly {
  // Bad words, longest first, so multi-word phrases are rewritten before the
  // shorter words they contain.
  private badWords: string[];

  // badWordPatterns[i] is the compiled matcher for badWords[i]; both arrays
  // are always updated together.
  private badWordPatterns: RegExp[];

  /**
   * @param options Language selection. All languages are loaded when this is
   *   omitted, when `allLanguages` is truthy, or when no `include*` flag is
   *   truthy. The object is only read, never modified.
   */
  constructor(options?: FamilyFriendlyOptions) {
    const includeAll =
      !options ||
      Boolean(options.allLanguages) ||
      !(
        options.includeEnglish ||
        options.includeArabic ||
        options.includeChinese ||
        options.includeFrench ||
        options.includeGerman ||
        options.includeIndonesian ||
        options.includeItalian ||
        options.includeSpanish
      );

    const languageLists: Array<[boolean | undefined, Iterable<string>]> = [
      [options?.includeEnglish, badEnglishWords],
      [options?.includeArabic, badArabicWords],
      [options?.includeChinese, badChineseWords],
      [options?.includeFrench, badFrenchWords],
      [options?.includeGerman, badGermanWords],
      [options?.includeIndonesian, badIndonesianWords],
      [options?.includeItalian, badItalianWords],
      [options?.includeSpanish, badSpanishWords],
    ];

    // A Set starts the list genuinely empty, drops words shared by several
    // languages, and makes the membership test below O(1).
    const allWords = new Set<string>();
    for (const [selected, words] of languageLists) {
      if (!includeAll && !selected) {
        continue;
      }
      for (const word of words) {
        // An empty word would compile to a pattern that matches at every
        // word boundary.
        if (word.length > 0) {
          allWords.add(word);
        }
      }
    }

    // Derive a "stub" spelling of each word by keeping only the first
    // occurrence of every character (e.g. "asshole" -> "ashole").
    // NOTE(review): this drops every repeated character, not just adjacent
    // repeats, so short stubs can collide with ordinary words - confirm
    // that this is intended.
    const derivedWords = new Set<string>();
    for (const word of allWords) {
      const stubWord = [...new Set(word.split(""))].join("");
      if (!allWords.has(stubWord)) {
        derivedWords.add(stubWord);
      }
    }

    this.badWords = [...allWords, ...derivedWords].sort(
      (a, b) => b.length - a.length
    );
    this.badWordPatterns = this.badWords.map((word) =>
      this.compilePattern(word)
    );
  }

  /**
   * Builds the regex source that matches `word` as a whole word, accepting
   * the look-alike characters from LETTER_SUBSTITUTIONS for each letter.
   *
   * NOTE(review): `\b` only recognises ASCII letters, digits and `_` as word
   * characters, so a word whose first or last character is outside that set
   * (accented letters, Arabic, Chinese, or a look-alike such as `@`) only
   * matches when an ASCII word character sits next to it.
   */
  private createRegexPattern(word: string): string {
    const escapeRegExp = (text: string) =>
      text.replace(/[.*+?^${}()|[\]\\]/g, "\\$&");

    const pattern = word
      .split("")
      .map((char) => LETTER_SUBSTITUTIONS[char.toLowerCase()] ?? escapeRegExp(char))
      .join("");

    return `\\b${pattern}\\b`;
  }

  // Compiles the global, case-insensitive matcher stored for `word`.
  private compilePattern(word: string): RegExp {
    return new RegExp(this.createRegexPattern(word), "gi");
  }

  /**
   * Returns true if `str` contains a bad word.
   *
   * A word counts as present when it occurs verbatim anywhere in `str`
   * (the original check, kept so previously flagged input is still flagged)
   * or when its pattern matches, which also catches different casing and
   * look-alike characters such as "ash0le".
   */
  public containsBadWord(str: string): boolean {
    return this.badWords.some(
      (word, index) =>
        str.includes(word) ||
        // search() ignores the pattern's global flag and lastIndex, so the
        // cached pattern can be reused safely.
        str.search(this.badWordPatterns[index]) !== -1
    );
  }

  /**
   * Returns `str` with every bad word overwritten by `maskAs`, repeated once
   * per character of the matched text.
   */
  public maskBadWords(str: string, maskAs: string = "*"): string {
    let masked = str;
    for (const pattern of this.badWordPatterns) {
      // A replacer function keeps `$` sequences in `maskAs` literal.
      masked = masked.replace(pattern, (match) => maskAs.repeat(match.length));
    }
    return masked;
  }

  /**
   * Like maskBadWords, but substitutes each bad word with
   * `replacementWordForABadWord` instead of masking it per character.
   */
  public replaceBadWords(
    str: string,
    replacementWordForABadWord: string = "[CENSORED]"
  ): string {
    let replaced = str;
    for (const pattern of this.badWordPatterns) {
      // A replacer function keeps `$` sequences in the replacement literal.
      replaced = replaced.replace(pattern, () => replacementWordForABadWord);
    }
    return replaced;
  }

  /**
   * Adds words to the filter. Empty strings and words already in the list
   * are ignored. No stub spellings are derived for added words.
   */
  public addWords(words: string[]): void {
    for (const word of words) {
      if (word.length === 0 || this.badWords.includes(word)) {
        continue;
      }

      // Insert before the first shorter word to keep the longest-first order.
      const shorterAt = this.badWords.findIndex(
        (existing) => existing.length < word.length
      );
      const insertAt = shorterAt === -1 ? this.badWords.length : shorterAt;

      this.badWords.splice(insertAt, 0, word);
      this.badWordPatterns.splice(insertAt, 0, this.compilePattern(word));
    }
  }

  /**
   * Removes words from the filter. Words are compared exactly
   * (case-sensitive); words not in the list are ignored.
   */
  public removeWords(words: string[]): void {
    for (const word of words) {
      const index = this.badWords.indexOf(word);
      if (index === -1) {
        continue;
      }
      this.badWords.splice(index, 1);
      this.badWordPatterns.splice(index, 1);
    }
  }
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
const familyFriendly = new FamilyFriendly();
|
||||||
|
|
||||||
|
const testString = "Don't be an ash0le ashole assh0le asshole";
|
||||||
|
console.log("Original:", testString);
|
||||||
|
console.log("Masked:", familyFriendly.maskBadWords(testString));
|
||||||
|
console.log("Contains bad word:", familyFriendly.containsBadWord(testString));
|
||||||
|
console.log("Replaced:", familyFriendly.replaceBadWords(testString));
|
||||||
|
*/
|
File diff suppressed because one or more lines are too long
|
@ -1,4 +1,4 @@
|
||||||
const words = `a tomar por culo,a tomar por saco,anda a cagar,apestar,bastardo,basura,bicho,burro,cabron,cabrón,cacorro,cagar,calientapollas,capullo,cara de culo,cara de monda,carajo,chancla (México),chapero,chichi,chimba,chingar,chocho,chúpame la pija,chúpame la polla,chúpamedias,chúpamela,chupar,cipote,coger,cojonazos,cojones,come mierda y muere,coño,culiao,culo,de puta madre,estúpido,follar,forro,gilipollas,gonorrea,guarra,hijo de perra,hijo de puta,hijueputa,hostia,huevo,huevón,huevos,idiota,imbécil,jode,joder,joder ,jódete,joto,la concha de tu madre,la hostia,la madre que te parió,lame botas,loco,los cojones,maldito,malparido,mamahuevo,mamón,marica,maricon,maricón,mariconazo,mariquita,me cago en la hostia,me cago en ti,métetelo por el culo,mierda,mongolo,nabo,no me jodas,no me jodás,no seas gilipollas,pajero,payaso,pelos de los huevos,pelotas,pelotudo,pendejo,percanta,perro,pichacorta,pinche,piruja,polla,pollas en vinagre,puta,Puta madre,puto,qué cabrón,que te den,que te jodan,qué te jodan,rabo,raja,soplapollas,tarado,tonto,tonto del culo,tontopollas,trompada,un putero,verga,vete a la mierda,vete a la verga,vete al demonio,vete al infierno,zorra,zunga`;
|
const words = `a tomar por culo,a tomar por saco,anda a cagar,apestar,bastardo,basura,bicho,burro,cabron,cabrón,cacorro,cagar,calientapollas,capullo,cara de culo,cara de monda,carajo,chancla (México),chapero,chichi,chimba,chingar,chocho,chúpame la pija,chúpame la polla,chúpamedias,chúpamela,chupar,cipote,coger,cojonazos,cojones,come mierda y muere,coño,culiao,culo,de puta madre,estúpido,follar,forro,gilipollas,gonorrea,guarra,hijo de perra,hijo de puta,hijueputa,hostia,huevo,huevón,huevos,idiota,imbécil,jode,joder,joder,jódete,joto,la concha de tu madre,la hostia,la madre que te parió,lame botas,loco,los cojones,maldito,malparido,mamahuevo,mamón,marica,maricon,maricón,mariconazo,mariquita,me cago en la hostia,me cago en ti,métetelo por el culo,mierda,mongolo,nabo,no me jodas,no me jodás,no seas gilipollas,pajero,payaso,pelos de los huevos,pelotas,pelotudo,pendejo,percanta,perro,pichacorta,pinche,piruja,polla,pollas en vinagre,puta,Puta madre,puto,qué cabrón,que te den,que te jodan,qué te jodan,rabo,raja,soplapollas,tarado,tonto,tonto del culo,tontopollas,trompada,un putero,verga,vete a la mierda,vete a la verga,vete al demonio,vete al infierno,zorra,zunga`;
|
||||||
|
|
||||||
// Tokenize the words, splitting at comma
|
// Tokenize the words, splitting at comma
|
||||||
export const badSpanishWords = new Set(words.split(","));
|
export const badSpanishWords = new Set(words.split(","));
|
||||||
|
|
|
@ -1,11 +1,12 @@
|
||||||
{
|
{
|
||||||
"compilerOptions": {
|
"compilerOptions": {
|
||||||
"target": "ES2020",
|
"outDir": "./dist",
|
||||||
|
"target": "ES2021",
|
||||||
"module": "ESNext",
|
"module": "ESNext",
|
||||||
"esModuleInterop": true,
|
"esModuleInterop": true,
|
||||||
"strict": true,
|
"strict": true,
|
||||||
"moduleResolution": "node",
|
"moduleResolution": "node",
|
||||||
"noEmit": true
|
"declaration": true
|
||||||
},
|
},
|
||||||
"include": ["src/**/*"],
|
"include": ["src/**/*"],
|
||||||
"exclude": ["node_modules", "**/*.spec.ts"]
|
"exclude": ["node_modules", "**/*.spec.ts"]
|
||||||
|
|
Loading…
Reference in New Issue