Perf: domain deduper using only trie + DFS

This commit is contained in:
SukkaW
2024-05-11 16:49:06 +08:00
parent 1b116637d2
commit 160e7bfab7
3 changed files with 164 additions and 42 deletions

View File

@@ -3,22 +3,29 @@ import { createTrie } from './trie';
export function domainDeduper(inputDomains: string[], toArray?: true): string[];
export function domainDeduper(inputDomains: string[], toArray: false): Set<string>;
export function domainDeduper(inputDomains: string[], toArray = true): string[] | Set<string> {
const trie = createTrie(inputDomains, true);
const sets = new Set(inputDomains);
for (let i = 0, len1 = inputDomains.length; i < len1; i++) {
const d = inputDomains[i];
if (d[0] !== '.') {
continue;
}
trie.substractSetInPlaceFromFound(d, sets);
sets.delete(d.slice(1));
}
const trie = createTrie(inputDomains, true, true);
const dumped = trie.dump();
if (toArray) {
return Array.from(sets);
return dumped;
}
return new Set(dumped);
return sets;
// const trie = createTrie(inputDomains, true);
// const sets = new Set(inputDomains);
// for (let i = 0, len1 = inputDomains.length; i < len1; i++) {
// const d = inputDomains[i];
// if (d[0] !== '.') {
// continue;
// }
// trie.substractSetInPlaceFromFound(d, sets);
// sets.delete(d.slice(1));
// }
// if (toArray) {
// return Array.from(sets);
// }
// return sets;
}