It's not perfect but it's kind of working so far. // UserScript // @name Spam Filter for Soyjak.st // @namespace http://tampermonkey.net/ // @version 2.0 // @description Hide spammy posts automatically // @match *://soyjak.st/*

Email
Subject
Comment
File
Embed
Voice
Poll
Password	(For file deletion.)

Anti-spam filter Chud 04/18/25 (Fri) 20:04:21 №6697 [Quote]

It's not perfect but it's kind of working so far.

// ==UserScript==
// @name Spam Filter for Soyjak.st
// @namespace http://tampermonkey.net/
// @version 2.0
// @description Hide spammy posts automatically
// @match *://soyjak.st/*
// ==/UserScript==

// Tunable limits read by isSpam() and isElongated().
const thresholds = {
  // Minimum number of occurrences before a word counts as repeated.
  repeatThreshold: 3,
  // Minimum share of the post's words a repeated word must account for.
  densityThreshold: 0.22,
  // Length of a same-character run that marks a word as elongated.
  elongationThreshold: 4,
};

/**
 * Reports whether `word` contains the same character repeated back to back
 * at least `threshold` times (e.g. "hellooooo" with a threshold of 4).
 *
 * @param {string} word - Single token to inspect.
 * @param {number} threshold - Run length that counts as elongation.
 * @returns {boolean} True as soon as a long enough run is found.
 */
function isElongated(word, threshold) {
  let runLength = 1;
  let index = 1;
  while (index < word.length) {
    const sameAsPrevious = word[index] === word[index - 1];
    // A differing character starts a fresh run of length one.
    runLength = sameAsPrevious ? runLength + 1 : 1;
    if (sameAsPrevious && runLength >= threshold) {
      return true;
    }
    index += 1;
  }
  return false;
}

/**
 * Decides whether a post's text looks like spam.
 *
 * A message is spam when any word is elongated (see isElongated), or when a
 * single word occurs at least `repeatThreshold` times and makes up at least
 * `densityThreshold` of all words.
 *
 * @param {string} message - Plain text of the post.
 * @param {{repeatThreshold: number, densityThreshold: number, elongationThreshold: number}} thresholds
 * @returns {boolean} True when the message matches a spam heuristic.
 */
function isSpam(message, thresholds) {
  // Drop the empty tokens that split() yields for leading/trailing whitespace
  // so they do not dilute the density calculation.
  const words = message
    .toLowerCase()
    .split(/\s+/)
    .filter((word) => word !== '');
  const totalWords = words.length;

  // A Map keeps words such as "constructor" from colliding with
  // Object.prototype members, which a plain-object tally would mis-count.
  const wordCount = new Map();

  for (const word of words) {
    if (isElongated(word, thresholds.elongationThreshold)) {
      return true;
    }
    wordCount.set(word, (wordCount.get(word) || 0) + 1);
  }

  for (const count of wordCount.values()) {
    const density = count / totalWords;
    if (count >= thresholds.repeatThreshold && density >= thresholds.densityThreshold) {
      return true;
    }
  }

  return false;
}

// Scan every reply body currently on the page and hide the ones flagged as spam.
const postElements = document.querySelectorAll('div.post.reply div.body');

postElements.forEach((el) => {
  const message = el.textContent.trim();
  if (!isSpam(message, thresholds)) {
    return;
  }

  const postContainer = el.closest('.post');
  if (!postContainer) {
    return;
  }

  postContainer.style.display = 'none'; // Hide the whole post

  // nextElementSibling skips text nodes, so whitespace between the post and
  // its trailing <br> no longer prevents the <br> from being removed.
  const next = postContainer.nextElementSibling;
  if (next && next.nodeName === 'BR') {
    next.remove();
  }
});

Chud 04/18/25 (Fri) 20:18:26 №6708 [Quote]

File: GKXWZQWakAAGmaP.jpeg 📥︎ (213.65 KB, 960x1280) ImgOps

>>6697 (OP)
Thanks a lot

Chud 04/18/25 (Fri) 20:19:31 №6709 [Quote]

File: ClipboardImage.png 📥︎ (23.27 KB, 495x592) ImgOps

Something you can do about these type of replies?

Chud 04/18/25 (Fri) 20:21:50 №6713 [Quote]

>>6709
Working on that like rn lol.

Chud 04/18/25 (Fri) 20:25:56 №6716 [Quote]

not gonna install your chink spyware

Chud 04/18/25 (Fri) 20:27:13 №6717 [Quote]

>>6716
You don't belong here if you can't read code, baboon

Chud 04/18/25 (Fri) 20:29:58 №6719 [Quote]

File: 3255235.webm 📥︎ (25.68 MB, 720x820) ImgOps

>4gegs need scripts to handle spam so their clitties don't leak

Chud 04/18/25 (Fri) 20:30:44 №6721 [Quote]

>>6719
gotta filter out boring niggers somehow

Chud 04/18/25 (Fri) 20:34:24 №6724 [Quote]

File: 37735.png 📥︎ (60.78 KB, 318x266) ImgOps

>>>6719 (You)
>gotta filter out boring niggers somehow

Chud 04/18/25 (Fri) 20:44:49 №6733 [Quote]

File: 1721541607630790.jpg 📥︎ (436.19 KB, 2048x1536) ImgOps

>>6709
Try this: I changed the isElongated function to count how often each letter occurs in a word, instead of only checking in the for loop whether the current letter is the same as the previous one.
Didn't realize 4chan/soyjak posts are just one line with no \n.

// ==UserScript==
// @name Spam Filter for Soyjak.st
// @version 2.1
// @description Hide spammy posts automatically
// @match *://soyjak.st/*
// ==/UserScript==

// Tunable limits read by isSpam() and isElongated().
const thresholds = {
  // Minimum number of occurrences before a word counts as repeated.
  repeatThreshold: 3,
  // Minimum share of the post's words a repeated word must account for.
  densityThreshold: 0.22,
  // Per-character count within one word at which isElongated() reports a hit.
  elongationThreshold: 3,
};

/**
 * Reports whether any single character occurs at least `threshold` times
 * anywhere in `word` (occurrences need not be adjacent).
 *
 * @param {string} word - Single token to inspect.
 * @param {number} threshold - Occurrence count that flags the word.
 * @returns {boolean} True as soon as one character reaches the threshold.
 */
function isElongated(word, threshold) {
  const occurrences = new Map();
  // Start at index 0: starting at 1 silently left the first character
  // uncounted, so e.g. "aaa" never reached a threshold of 3.
  for (let i = 0; i < word.length; i++) {
    const char = word[i];
    const count = (occurrences.get(char) || 0) + 1;
    occurrences.set(char, count);
    if (count >= threshold) {
      console.log(char, 'count:', count);
      return true;
    }
  }
  return false;
}

/**
 * Decides whether a post's text looks like spam.
 *
 * Tokens beginning with ">>" are ignored entirely. A message is spam when
 * any remaining word is flagged by isElongated, or when one word occurs at
 * least `repeatThreshold` times and makes up at least `densityThreshold` of
 * the counted words.
 *
 * @param {string} message - Plain text of the post.
 * @param {{repeatThreshold: number, densityThreshold: number, elongationThreshold: number}} thresholds
 * @returns {boolean} True when the message matches a spam heuristic.
 */
function isSpam(message, thresholds) {
  // A Map keeps words such as "constructor" from colliding with
  // Object.prototype members, which a plain-object tally would mis-count.
  const wordCount = new Map();
  let totalWords = 0;

  for (const word of message.toLowerCase().split(/\s+/)) {
    if (word === '') continue;
    if (word.startsWith('>>')) continue;
    totalWords++;

    if (isElongated(word, thresholds.elongationThreshold)) {
      console.log(`${word} is spam!!!`);
      return true;
    }
    wordCount.set(word, (wordCount.get(word) || 0) + 1);
  }

  for (const count of wordCount.values()) {
    const density = count / totalWords;
    if (count >= thresholds.repeatThreshold && density >= thresholds.densityThreshold) {
      return true;
    }
  }

  return false;
}

// Scan every reply body currently on the page and hide the ones flagged as spam.
const postElements = document.querySelectorAll('div.post.reply div.body');

postElements.forEach((el) => {
  const message = el.textContent.trim();
  if (!isSpam(message, thresholds)) {
    return;
  }

  const postContainer = el.closest('.post');
  if (!postContainer) {
    return;
  }

  postContainer.style.display = 'none'; // Hide the whole post

  // nextElementSibling skips text nodes, so whitespace between the post and
  // its trailing <br> no longer prevents the <br> from being removed.
  const next = postContainer.nextElementSibling;
  if (next && next.nodeName === 'BR') {
    next.remove();
  }
});

Chud 04/18/25 (Fri) 20:50:14 №6734 [Quote]

>>6733
Oh lmfao the script even blocked this post because of this line
*://soyjak.st/*//

Chud 04/18/25 (Fri) 20:53:30 №6735 [Quote]

>>6709
GEEEEEG
COPE
>COPE
COPE
COPE
>COPE
COPE>COPE
>COPE
COPE
>COPE
COPE
>COPE
COPE

Chud 04/18/25 (Fri) 20:56:26 №6739 [Quote]

>>6733
Try mine instead

// Tunable limits read by isSpam() and isElongated().
const thresholds = {
  // Minimum number of occurrences before a word counts as repeated.
  repeatThreshold: 3,
  // Minimum share of the post's words a repeated word must account for.
  densityThreshold: 0.22,
  // Length of a same-character run that marks a word as elongated.
  elongationThreshold: 4,
};

/**
 * Reports whether `word` contains a run of one character repeated back to
 * back at least `threshold` times.
 *
 * @param {string} word - Single token to inspect.
 * @param {number} threshold - Run length that counts as elongation.
 * @returns {boolean} True as soon as a long enough run is found.
 */
function isElongated(word, threshold) {
  // Index at which the current run of identical characters began.
  let runStart = 0;
  for (let i = 1; i < word.length; i++) {
    if (word[i] !== word[i - 1]) {
      runStart = i;
      continue;
    }
    const runLength = i - runStart + 1;
    if (runLength >= threshold) {
      return true;
    }
  }
  return false;
}

/**
 * Decides whether a post's text looks like spam.
 *
 * Three heuristics are applied in order:
 *  1. any word is elongated (see isElongated);
 *  2. one word occurs at least `repeatThreshold` times and makes up at least
 *     `densityThreshold` of all words;
 *  3. the message has more than five non-empty lines and, after stripping
 *     leading ">" characters, one line accounts for at least half of them.
 *
 * @param {string} message - Plain text of the post.
 * @param {{repeatThreshold: number, densityThreshold: number, elongationThreshold: number}} thresholds
 * @returns {boolean} True when the message matches a spam heuristic.
 */
function isSpam(message, thresholds) {
  // Drop the empty tokens that split() yields for leading/trailing whitespace
  // so they do not dilute the density calculation.
  const words = message
    .toLowerCase()
    .split(/\s+/)
    .filter((word) => word !== '');
  const totalWords = words.length;

  // Maps keep entries such as "constructor" from colliding with
  // Object.prototype members, which a plain-object tally would mis-count.
  const wordCount = new Map();

  for (const word of words) {
    if (isElongated(word, thresholds.elongationThreshold)) {
      return true;
    }
    wordCount.set(word, (wordCount.get(word) || 0) + 1);
  }

  for (const count of wordCount.values()) {
    const density = count / totalWords;
    if (count >= thresholds.repeatThreshold && density >= thresholds.densityThreshold) {
      return true;
    }
  }

  // Normalize lines: remove ">", trim whitespace, lowercase
  const lines = message
    .split('\n')
    .map((line) => line.replace(/^>+/, '').trim().toLowerCase())
    .filter(Boolean);

  // The repeated-line heuristic only applies to posts with more than 5 lines.
  if (lines.length > 5) {
    const lineCount = new Map();
    for (const line of lines) {
      lineCount.set(line, (lineCount.get(line) || 0) + 1);
    }

    for (const count of lineCount.values()) {
      if (count / lines.length >= 0.5) {
        return true; // At least half of the lines are the same
      }
    }
  }

  return false;
}

// Main filtering logic: scan every reply body on the page and hide the ones
// flagged as spam.
const postElements = document.querySelectorAll('div.post.reply div.body');

postElements.forEach((el) => {
  const message = el.textContent.trim();
  if (!isSpam(message, thresholds)) {
    return;
  }

  const postContainer = el.closest('.post');
  if (!postContainer) {
    return;
  }

  postContainer.style.display = 'none'; // Hide the whole post

  // nextElementSibling skips text nodes, so whitespace between the post and
  // its trailing <br> no longer prevents the <br> from being removed.
  const next = postContainer.nextElementSibling;
  if (next && next.nodeName === 'BR') {
    next.remove();
  }
});

Chud 04/18/25 (Fri) 20:59:12 №6742 [Quote]

Make sure the @match line at the top looks like this

// @match *://*soyjak.st/*

Chud 04/18/25 (Fri) 21:03:58 №6746 [Quote]

>>6697 (OP)
bro i just /.{500}/ and it filters 99% of spam, but long posts are also filtered unadvisedly

Chud 04/18/25 (Fri) 21:25:14 №6759 [Quote]

File: 1721330145327533.jpg 📥︎ (664.21 KB, 1007x1007) ImgOps

>>6746
I was bored and I found it fun to work on.

The spam filter now handles post references correctly:
it skips valid >>123456 quotes but still checks the text that follows them for spam.
Only quote numbers of 3 to 9 digits (100 through 999999999) are recognized.

// ==UserScript==
// @name Spam Filter for Soyjak.st
// @namespace http://tampermonkey.net/
// @version 2.2
// @description Hide spammy posts automatically
// @match *://*soyjak.st/*
// ==/UserScript==

// Tunable limits read by isSpam() and isElongated().
const thresholds = {
  // Minimum number of occurrences before a word counts as repeated.
  repeatThreshold: 3,
  // Minimum share of the post's words a repeated word must account for.
  densityThreshold: 0.22,
  // Per-character count within one word at which isElongated() reports a hit.
  elongationThreshold: 3,
};

/**
 * Reports whether any single character occurs at least `threshold` times
 * anywhere in `word` (occurrences need not be adjacent).
 *
 * @param {string} word - Single token to inspect.
 * @param {number} threshold - Occurrence count that flags the word.
 * @returns {boolean} True as soon as one character reaches the threshold.
 */
function isElongated(word, threshold) {
  const occurrences = new Map();
  // Start at index 0: starting at 1 silently left the first character
  // uncounted, so e.g. "aaa" never reached a threshold of 3.
  for (let i = 0; i < word.length; i++) {
    const char = word[i];
    const count = (occurrences.get(char) || 0) + 1;
    occurrences.set(char, count);
    if (count >= threshold) {
      return true;
    }
  }
  return false;
}

/**
 * Decides whether a post's text looks like spam.
 *
 * A leading post reference (">>" followed by 3 to 9 digits) is stripped from
 * each token; a token that was only a reference is skipped. A message is spam
 * when any remaining word is flagged by isElongated, or when one word occurs
 * at least `repeatThreshold` times and makes up at least `densityThreshold`
 * of the counted words.
 *
 * @param {string} message - Plain text of the post.
 * @param {{repeatThreshold: number, densityThreshold: number, elongationThreshold: number}} thresholds
 * @returns {boolean} True when the message matches a spam heuristic.
 */
function isSpam(message, thresholds) {
  const quotePrefix = /^>>(\d{3,9})/;
  // A Map keeps words such as "constructor" from colliding with
  // Object.prototype members, which a plain-object tally would mis-count.
  const wordCount = new Map();
  let totalWords = 0;

  for (let word of message.toLowerCase().split(/\s+/)) {
    if (word === '') continue;

    // Declared locally: the undeclared assignment leaked a global and throws
    // a ReferenceError in strict mode.
    const quoteMatch = word.match(quotePrefix);
    if (quoteMatch) {
      // Remove the quoted part for spam checking
      word = word.slice(quoteMatch[0].length);
      if (word === '') continue;
    }

    totalWords++;

    if (isElongated(word, thresholds.elongationThreshold)) {
      console.log(`${word} is spam!!!`);
      return true;
    }
    wordCount.set(word, (wordCount.get(word) || 0) + 1);
  }

  for (const count of wordCount.values()) {
    const density = count / totalWords;
    if (count >= thresholds.repeatThreshold && density >= thresholds.densityThreshold) {
      return true;
    }
  }

  return false;
}

// Scan every reply body currently on the page and hide the ones flagged as spam.
const postElements = document.querySelectorAll('div.post.reply div.body');

postElements.forEach((el) => {
  const message = el.textContent.trim();
  if (!isSpam(message, thresholds)) {
    return;
  }

  const postContainer = el.closest('.post');
  if (!postContainer) {
    return;
  }

  postContainer.style.display = 'none'; // Hide the whole post

  // nextElementSibling skips text nodes, so whitespace between the post and
  // its trailing <br> no longer prevents the <br> from being removed.
  const next = postContainer.nextElementSibling;
  if (next && next.nodeName === 'BR') {
    next.remove();
  }
});

Chud 04/18/25 (Fri) 23:22:55 №6830 [Quote]

/* Render elements with class "heading" at normal weight.
   The selector needs the leading dot; bare `heading` is a type selector. */
.heading {
  font-weight: normal !important;
}

/* Fully remove replies (and the <br> directly after each) whose files or body
   carry the inline style "display: none;", and replies that contain a link
   with "sage" in its href. */
.post.reply:has(.files[style="display: none;"]),
.post.reply:has(.files[style="display: none;"]) + br,
.post.reply:has(.body[style="display: none;"]),
.post.reply:has(.body[style="display: none;"]) + br,
div.post.reply:has(a[href*="sage"]),
div.post.reply:has(a[href*="sage"]) + br {
  display: none !important;
}

/* Cap reply bodies at half the viewport height and scroll the overflow. */
div.post.reply div.body {
  overflow-y: auto;
  max-height: 50vh;
}

/* Stretch replies to nearly the full width. */
div.post.reply {
  max-width: 98% !important;
  width: 98% !important;
}

/* Hide replies with a download attribute containing "cado", and div.mix
   entries whose image data-subject contains "coinslot" (case-insensitive). */
.post.reply:has([download*="cado"]),
.post.reply:has([download*="cado"]) + br,
div.mix:has(img[data-subject*="coinslot" i]) {
  display: none !important;
}

Chud 04/19/25 (Sat) 03:45:12 №6955 [Quote]

File: 1743489895994183.jpg 📥︎ (137.3 KB, 1440x1799) ImgOps

Now it dynamically filters for new posts before you can see how retarded it was.

// ==UserScript==
// @name Spam Filter for Soyjak.st
// @namespace http://tampermonkey.net/
// @version 2.3
// @description Hide spammy posts automatically
// @match *://*soyjak.st/*
// ==/UserScript==

// Tunable limits read by isSpam() and isElongated().
const thresholds = {
  // Minimum number of occurrences before a word counts as repeated.
  repeatThreshold: 10,
  // Minimum share of the post's words a repeated word must account for.
  densityThreshold: 0.22,
  // Per-character count within one word at which isElongated() reports a hit.
  elongationThreshold: 10,
};

/**
 * Reports whether any single character occurs at least `threshold` times
 * anywhere in `word` (occurrences need not be adjacent).
 *
 * @param {string} word - Single token to inspect.
 * @param {number} threshold - Occurrence count that flags the word.
 * @returns {boolean} True as soon as one character reaches the threshold.
 */
function isElongated(word, threshold) {
  const occurrences = new Map();
  // Start at index 0: starting at 1 silently left the first character
  // uncounted, so a word of exactly `threshold` identical characters was missed.
  for (let i = 0; i < word.length; i++) {
    const char = word[i];
    const count = (occurrences.get(char) || 0) + 1;
    occurrences.set(char, count);
    if (count >= threshold) {
      return true;
    }
  }
  return false;
}

/**
 * Decides whether a post's text looks like spam.
 *
 * Leading post references (">>" followed by 1 to 9 digits, possibly several
 * in a row) are stripped from each token; a token made only of references is
 * skipped. A message is spam when any remaining word is flagged by
 * isElongated, or when one word occurs at least `repeatThreshold` times and
 * makes up at least `densityThreshold` of the counted words.
 *
 * @param {string} message - Plain text of the post.
 * @param {{repeatThreshold: number, densityThreshold: number, elongationThreshold: number}} thresholds
 * @returns {boolean} True when the message matches a spam heuristic.
 */
function isSpam(message, thresholds) {
  const quotePrefix = /^>>(\d{1,9})/;
  // A Map keeps words such as "constructor" from colliding with
  // Object.prototype members, which a plain-object tally would mis-count.
  const wordCount = new Map();
  let totalWords = 0;

  for (let word of message.toLowerCase().split(/\s+/)) {
    if (word === '') continue;

    // Declared locally: the undeclared assignment leaked a global and throws
    // a ReferenceError in strict mode.
    let quoteMatch = word.match(quotePrefix);
    // Check for quotes and remove them
    while (quoteMatch) {
      word = word.slice(quoteMatch[0].length);
      quoteMatch = word.match(quotePrefix);
    }
    // This check must sit outside the while loop: a `continue` inside it
    // only restarts the inner loop, so quote-only tokens were being counted
    // as an empty word.
    if (word === '') continue;

    totalWords++;

    if (isElongated(word, thresholds.elongationThreshold)) {
      console.log(`${word} is spam!!!`);
      return true;
    }
    wordCount.set(word, (wordCount.get(word) || 0) + 1);
  }

  for (const count of wordCount.values()) {
    const density = count / totalWords;
    if (count >= thresholds.repeatThreshold && density >= thresholds.densityThreshold) {
      return true;
    }
  }

  return false;
}
/**
 * Hides the post that owns `el` when its text is classified as spam.
 *
 * @param {Element} el - A post body element; its trimmed textContent is
 *   passed to isSpam together with the module-level `thresholds`.
 * @returns {void}
 */
function processPostElement(el) {
  const message = el.textContent.trim();
  if (!isSpam(message, thresholds)) {
    return;
  }

  const postContainer = el.closest('.post');
  if (!postContainer) {
    return;
  }

  postContainer.style.display = 'none'; // Hides the whole post

  // nextElementSibling skips text nodes, so whitespace between the post and
  // its trailing <br> no longer prevents the <br> from being removed.
  const next = postContainer.nextElementSibling;
  if (next && next.nodeName === 'BR') {
    next.remove();
  }
}

// First pass: filter the reply bodies that are already in the document.
const postElements = document.querySelectorAll('div.post.reply div.body');
for (let i = 0; i < postElements.length; i++) {
  processPostElement(postElements[i], i, postElements);
}

// Second pass: filter reply bodies as they are inserted later on.
const observer = new MutationObserver((mutations) => {
  for (const mutation of mutations) {
    const hasAddedNodes = mutation.type === 'childList' && mutation.addedNodes.length > 0;
    if (!hasAddedNodes) {
      continue;
    }

    mutation.addedNodes.forEach((node) => {
      // Text and comment nodes cannot be or contain a post body.
      if (node.nodeType !== Node.ELEMENT_NODE) {
        return;
      }

      // The added node is either a post body itself or may contain some.
      let newPostBodies;
      if (node.matches('div.post.reply div.body')) {
        newPostBodies = [node];
      } else {
        newPostBodies = node.querySelectorAll('div.post.reply div.body');
      }
      newPostBodies.forEach(processPostElement);
    });
  }
});

// Watch the thread container when there is one, otherwise the whole body.
const threadContainer = document.querySelector('div.thread') || document.body;
observer.observe(threadContainer, { childList: true, subtree: true });

Chud 04/19/25 (Sat) 03:55:37 №6961 [Quote]

File: GEG.png 📥︎ (12.01 KB, 600x800) ImgOps

raping slitty chinky yellow whores with my BWC

Chud 04/19/25 (Sat) 06:40:39 №7029 [Quote]

File: catacando.gif 📥︎ (2.75 MB, 1720x1632) ImgOps

spent too much time on this raisin
TY for filters i am codelet

Chud 04/19/25 (Sat) 07:03:08 №7051 [Quote]

>>6697 (OP)
This script is a spam detection and filtering system for a website (likely a forum or message board). It identifies spam messages by looking for three specific patterns and then hides posts that match these patterns. Here's how it works:

### Spam Detection Logic

The script identifies spam through three criteria:

1. Word elongation - It checks if any word has the same character repeated multiple times in a row (e.g., "hellooooo"). If a character repeats 4 or more times consecutively (the `elongationThreshold`), the message is considered spam.

2. Word repetition - It counts how many times each word appears in a message. If any word appears 3 or more times (the `repeatThreshold`), it might be spam.

3. Word density - For repeated words, it calculates how much of the total message consists of that word. If a word appears frequently enough to make up 22% or more of the total words (the `densityThreshold`) AND it meets the repetition threshold, the message is considered spam.

### Implementation Steps

1. The `isElongated()` function checks for character repetition within words
2. The `isSpam()` function:
- Splits the message into words
- Checks each word for elongation
- Counts word frequency
- Calculates word density
- Returns true if any spam criteria are met

3. The DOM manipulation section:
- Finds all message body elements on the page with `document.querySelectorAll('div.post.reply div.body')`
- Tests each message with the spam detection function
- Hides posts identified as spam by setting `display: 'none'`
- Removes any line break (`<br>`) elements that follow the hidden post

### How It Fights Spam

This targets common spam tactics like:
- Repeated words (e.g., "buy buy buy buy")
- Stretched out text (e.g., "hiiiiiii" or "frreeeeee")
- Messages with extremely low word variety

It's particularly effective against low-effort spam that relies on repetition and unusual text patterns, while being simple enough to run client-side in a browser.

Chud 04/19/25 (Sat) 07:41:03 №7083 [Quote]

coal

Chud 04/19/25 (Sat) 07:55:57 №7091 [Quote]

jannies should block these scripts so 4cucks had to adapt to bait geg

Chud 04/19/25 (Sat) 21:41:24 №7467 [Quote]

File: 1741119330284628.jpg 📥︎ (703.72 KB, 1440x1797) ImgOps

The spam filter now flags image and quote spam. Try this thread to test it.
>>>/soy/10710928

[code]
// ==UserScript==
// @name Spam Filter for Soyjak.st
// @namespace http://tampermonkey.net/
// @version 3.0
// @description Hide spammy posts automatically
// @match *://*soyjak.st/*
// ==/UserScript==

// Tunable limits read by isSpam() and isElongated().
const thresholds = {
  // Minimum occurrences before a word counts as repeated; also the number
  // of post references a single post may contain before it is flagged.
  repeatThreshold: 10,
  // Minimum share of the post's words a repeated word must account for.
  densityThreshold: 0.22,
  // Per-character count within one word at which isElongated() reports a hit.
  elongationThreshold: 10,
  // A post with more <img> elements than this is flagged.
  maxImagesThreshold: 5,
  // A post repeating one image src at least this many times is flagged.
  imageSrcRepeatThreshold: 5,
};

/**
 * Reports whether any single character occurs at least `threshold` times
 * anywhere in `word` (occurrences need not be adjacent).
 *
 * @param {string} word - Single token to inspect.
 * @param {number} threshold - Occurrence count that flags the word.
 * @returns {boolean} True as soon as one character reaches the threshold.
 */
function isElongated(word, threshold) {
  const occurrences = new Map();
  // Start at index 0: starting at 1 silently left the first character
  // uncounted, so a word of exactly `threshold` identical characters was missed.
  for (let i = 0; i < word.length; i++) {
    const char = word[i];
    const count = (occurrences.get(char) || 0) + 1;
    occurrences.set(char, count);
    if (count >= threshold) {
      return true;
    }
  }
  return false;
}

/**
 * Checks a post body for word, quote, and image spam.
 *
 * The post is spam when any of the following holds:
 *  - it contains more than `repeatThreshold` post references (">>" followed
 *    by 1 to 9 digits);
 *  - any word (after stripping leading references) is flagged by isElongated;
 *  - one word occurs at least `repeatThreshold` times and makes up at least
 *    `densityThreshold` of the counted words;
 *  - it contains more than `maxImagesThreshold` <img> elements;
 *  - one image `src` occurs at least `imageSrcRepeatThreshold` times.
 *
 * @param {Element} element - Post body; its textContent and <img> descendants are read.
 * @param {{repeatThreshold: number, densityThreshold: number, elongationThreshold: number,
 *          maxImagesThreshold: number, imageSrcRepeatThreshold: number}} thresholds
 * @returns {boolean} True when the post matches a spam heuristic.
 */
function isSpam(element, thresholds) {
  const quotePrefix = /^>>(\d{1,9})/;
  // Maps keep entries such as "constructor" from colliding with
  // Object.prototype members, which a plain-object tally would mis-count.
  const wordCount = new Map();
  let totalQuotes = 0;
  let totalWords = 0;

  for (let word of element.textContent.toLowerCase().split(/\s+/)) {
    if (word === '') continue;

    let quoteMatch = word.match(quotePrefix);
    while (quoteMatch) {
      totalQuotes++;
      if (totalQuotes > thresholds.repeatThreshold) {
        return true;
      }
      word = word.slice(quoteMatch[0].length);
      quoteMatch = word.match(quotePrefix);
    }
    // This check must sit outside the while loop: a `continue` inside it
    // only restarts the inner loop, so quote-only tokens were being counted
    // as an empty word.
    if (word === '') continue;

    totalWords++;

    if (isElongated(word, thresholds.elongationThreshold)) {
      return true;
    }
    wordCount.set(word, (wordCount.get(word) || 0) + 1);
  }

  for (const count of wordCount.values()) {
    const density = count / totalWords;
    if (count >= thresholds.repeatThreshold && density >= thresholds.densityThreshold) {
      return true;
    }
  }

  // Check for <img> tags
  const images = element.querySelectorAll('img');
  if (images.length > thresholds.maxImagesThreshold) {
    return true;
  }

  const imageSrcCount = new Map();
  for (const img of images) {
    const src = img.getAttribute('src') || '';
    const count = (imageSrcCount.get(src) || 0) + 1;
    if (count >= thresholds.imageSrcRepeatThreshold) {
      return true;
    }
    imageSrcCount.set(src, count);
  }

  return false;
}

/**
 * Hides the post that owns `el` when isSpam classifies the body as spam.
 *
 * @param {Element} el - A post body element, passed to isSpam together with
 *   the module-level `thresholds`.
 * @returns {void}
 */
function processPostElement(el) {
  if (!isSpam(el, thresholds)) {
    return;
  }

  const postContainer = el.closest('.post');
  if (!postContainer) {
    return;
  }

  postContainer.style.display = 'none'; // Hide the whole post

  // nextElementSibling skips text nodes, so whitespace between the post and
  // its trailing <br> no longer prevents the <br> from being removed.
  const next = postContainer.nextElementSibling;
  if (next && next.nodeName === 'BR') {
    next.remove();
  }
}

// Set up MutationObserver to filter posts that are inserted after page load.
const observer = new MutationObserver((mutations) => {
  mutations.forEach((mutation) => {
    // The comparison operators here were mangled when the script was posted
    // ("!" and "=" instead of "!==" and "==="), which is a syntax error.
    if (mutation.type !== 'childList' || mutation.addedNodes.length === 0) return;

    mutation.addedNodes.forEach((node) => {
      // Text and comment nodes cannot be or contain a post body.
      if (node.nodeType !== Node.ELEMENT_NODE) return;

      // The added node is either a post body itself or may contain some.
      const newPostBodies = node.matches('div.post.reply div.body')
        ? [node]
        : node.querySelectorAll('div.post.reply div.body');
      newPostBodies.forEach(processPostElement);
    });
  });
});

// Observe the parent container of posts, falling back to the whole body.
const threadContainer = document.querySelector('div.thread') || document.body;
observer.observe(threadContainer, {
  childList: true,
  subtree: true,
});

// Process existing posts, main logic
const postElements = document.querySelectorAll('div.post.reply div.body');
postElements.forEach(processPostElement);
[/code]

Chud 04/19/25 (Sat) 21:45:05 №7469 [Quote]

if (mutation.type !== 'childList' || mutation.addedNodes.length === 0) return;

Dammit, the '= = =' makes it large and red. Just copy the code above and replace that line , should work regardless.

Chud 04/20/25 (Sun) 00:02:36 №7524 [Quote]

File: ClipboardImage.png 📥︎ (15.91 KB, 807x105) ImgOps

>>7469
Should look like this then?

Chud 04/20/25 (Sun) 00:14:22 №7531 [Quote]

>>7524
Should be !== (that is, "!=" immediately followed by "=", with no space in between)

Chud 04/20/25 (Sun) 00:15:20 №7533 [Quote]

>>7524
And it should be mutation.addedNodes.length == 0

Chud 04/20/25 (Sun) 14:16:42 №7942 [Quote]

>>6697 (OP)
>not using MutationObserver
ngmi

Chud 04/20/25 (Sun) 14:22:36 №7953 [Quote]

>>6697 (OP)
dilate

Chud 04/20/25 (Sun) 14:22:54 №7954 [Quote]

>>6716
based

Chud 04/20/25 (Sun) 16:59:22 №8103 [Quote]

>>7467
No one fucking cares about your pajeet code nigger

Chud 04/20/25 (Sun) 17:42:46 №8173 [Quote]

File: 1678934169050599.jpg 📥︎ (47.76 KB, 1024x796) ImgOps

forgot dot in the beginning (custom CSS that adds scroll bars to long posts and fully hides the hidden posts not just minimizes them also hides some nicocado spam):

/* Render elements with class "heading" at normal weight. */
.heading {
  font-weight: normal !important;
}

/* Fully remove replies (and the <br> directly after each) whose body carries
   the inline style "display: none;", and replies that contain a link with
   "sage" in its href. */
.post.reply:has(.body[style="display: none;"]),
.post.reply:has(.body[style="display: none;"]) + br,
div.post.reply:has(a[href*="sage"]),
div.post.reply:has(a[href*="sage"]) + br {
  display: none !important;
}

/* Cap reply bodies at half the viewport height and scroll the overflow. */
div.post.reply div.body {
  overflow-y: auto;
  max-height: 50vh;
}

/* Stretch replies to nearly the full width. */
div.post.reply {
  max-width: 98% !important;
  width: 98% !important;
}

/* Hide div.mix entries whose image data-subject contains "coinslot"
   (case-insensitive). */
div.mix:has(img[data-subject*="coinslot" i]) {
  display: none !important;
}

Chud 04/20/25 (Sun) 17:43:27 №8174 [Quote]

>>7467
>// Set up MutationObserver to watch for new posts
based. we're evolving

Chud 04/20/25 (Sun) 20:28:49 №8425 [Quote]

>>7467
What a steaming pile of raisin, you niggers actually think it's fine to write code like this? Holy raisin, the learn 2 code meme is real.

Chud 04/20/25 (Sun) 22:06:36 №8551 [Quote]

>>8425
give some constructive feedback on what's wrong with it or shut the fuck up nigger

Chud 04/20/25 (Sun) 22:08:04 №8552 [Quote]

>>8551
I'm not gonna spoonfeed you everything that's wrong with it, retarded nigger.

Chud 04/20/25 (Sun) 22:14:50 №8564 [Quote]

ITT: yellow fever niggas vibe coding a shoddy userscript spam filter so they can spam their yellow fever threads on a woahjack appreciation forum

Chud 04/20/25 (Sun) 23:38:38 №8607 [Quote]

>>6697 (OP)
Don't ever attempt to write any piece of code ever again, this is literally embarassing to look at. It's utterly pathetic, kill yourself. It doesn't even work.

Chud 04/20/25 (Sun) 23:46:25 №8609 [Quote]

>>8607
>It doesn't even work.
works on my machine

Chud 04/20/25 (Sun) 23:49:29 №8612 [Quote]

>>6697 (OP)
>>6733
>>6739
>>6759
>>6955
Just stop, you can't code.
>>7467

Chud 04/20/25 (Sun) 23:52:57 №8613 [Quote]

>>8564

u gay nigga

Chud 04/21/25 (Mon) 00:51:14 №8631 [Quote]

>>8552
>I can't list a single example
the shut the fuck up nigger

Chud 04/21/25 (Mon) 01:46:37 №8648 [Quote]

>>8631
>needs to be spoonfed
lmfao

Chud 04/21/25 (Mon) 03:30:13 №8715 [Quote]

File: Screenshot 2025-04-04 2116….png 📥︎ (3.53 MB, 1920x1080) ImgOps

OP, I appreciate the work you've done
>>8173
Yours too

Chud 04/21/25 (Mon) 17:32:58 №9154 [Quote]

>>8715
based

Chud 04/22/25 (Tue) 00:11:15 №9363 [Quote]

>>6697 (OP)
Thanks. Still can't get the built in filter to work in the catalog.

Chud 04/22/25 (Tue) 00:20:42 №9368 [Quote]

>>9363
yea the catalog is its own type of beast

Chud 04/22/25 (Tue) 00:40:16 №9387 [Quote]

>>8612
>>8607
>>8552
>>8425

As a professional software engineer of 10 years I don't see anything obviously wrong with this code
What are you niggers smoking

Chud 04/22/25 (Tue) 00:54:03 №9393 [Quote]

File: 1742585916692335.webm 📥︎ (3.32 MB, 1080x1766) ImgOps