Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
189 changes: 135 additions & 54 deletions JS/edgechains/arakoodev/package.json
Original file line number Diff line number Diff line change
@@ -1,79 +1,160 @@
{


"name": "@arakoodev/edgechains.js",

"version": "0.1.23",

"main": "dist/index.js",

"files": [

"dist"

],

"exports": {

"./ai": "./dist/ai/src/index.js",

"./vector-db": "./dist/vector-db/src/index.js",

"./document-loader": "./dist/document-loader/src/index.js",

"./splitter": "./dist/splitter/src/index.js",

"./arakooserver": "./dist/arakooserver/src/index.js",

"./db": "./dist/db/src/index.js",

"./scraper": "./dist/scraper/src/index.js",

"./sync-rpc": "./dist/sync-rpc/index.js"

},

"scripts": {

"build": "rm -rf dist && tsc -b",

"lint": "eslint --ignore-path .eslintignore --ext .js,.ts",

"format": "prettier --ignore-path .gitignore --write \"**/*.+(js|ts|json)\"",

"test": "vitest"

},

"dependencies": {

"@aws-sdk/client-comprehend": "^3.1055.0",

"@babel/core": "^7.24.4",

"@babel/preset-env": "^7.24.4",

"@hono/node-server": "^0.6.0",

"@lifeomic/attempt": "^3.1.0",

"@playwright/test": "^1.45.3",

"@supabase/supabase-js": "^2.42.3",

"axios": "^1.7.4",

"axios-retry": "^4.1.0",

"cheerio": "^1.0.0-rc.12",

"cors": "^2.8.5",

"document": "^0.4.7",

"dts-bundle-generator": "^9.3.1",

"esbuild": "^0.20.2",

"hono": "3.9",

"jest-environment-jsdom": "^29.7.0",

"jsdom": "^24.1.0",

"node-html-parser": "^6.1.13",

"pdf-parse": "^1.1.1",

"pg": "^8.11.5",

"playwright": "^1.45.1",

"prettier": "^3.2.5",

"regenerator-runtime": "^0.14.1",

"request": "^2.88.2",

"retell-client-js-sdk": "^2.0.4",

"retell-sdk": "^4.9.0",

"retry": "^0.13.1",

"ts-node": "^10.9.2",

"typeorm": "^0.3.20",

"vitest": "^2.0.3",

"youtube-transcript": "^1.2.1",

"zod": "^3.23.8",

"zod-to-json-schema": "^3.23.0"

},

"keywords": [],

"author": "",

"license": "ISC",

"devDependencies": {

"@babel/preset-typescript": "^7.24.1",

"@types/cors": "^2.8.17",

"@types/jest": "^29.5.12",

"@types/node": "^20.17.2",

"@types/pdf-parse": "^1.1.4",

"@types/ws": "^8.5.12",

"buffer": "^6.0.3",

"crypto-browserify": "^3.12.1",

"jest": "^29.7.0",

"process": "^0.11.10",

"stream-browserify": "^3.0.0",

"stream-http": "^3.2.0",

"ts-jest": "^29.1.2",

"ts-loader": "^9.5.1",

"typescript": "^5.6.3",

"util": "^0.12.5"

}

}

7 changes: 6 additions & 1 deletion JS/edgechains/arakoodev/src/ai/src/index.ts
Original file line number Diff line number Diff line change
@@ -1,5 +1,10 @@
// Barrel file: re-exports the classes and types below from their implementation modules.
export { OpenAI } from "./lib/openai/openai.js";
export { GeminiAI } from "./lib/gemini/gemini.js";
export { LlamaAI } from "./lib/llama/llama.js";
export { RetellAI } from "./lib/retell-ai/retell.js";
export { RetellWebClient } from "./lib/retell-ai/retellWebClient.js";
export { AwsComprehendRedactor } from "./lib/aws-comprehend/comprehendRedactor.js";
// Type-only re-export so the option/input shapes are importable without a runtime dependency.
export type {
  AwsComprehendRedactorOptions,
  ChatInputWithPrompt,
} from "./lib/aws-comprehend/comprehendRedactor.js";
Original file line number Diff line number Diff line change
@@ -0,0 +1,94 @@
import {
ComprehendClient,
DetectPiiEntitiesCommand,
LanguageCode,
PiiEntity,
} from "@aws-sdk/client-comprehend";

/**
 * Minimal client contract the redactor depends on: any object exposing a
 * `send` method that accepts a `DetectPiiEntitiesCommand` and resolves to an
 * object carrying an optional `Entities` list. Callers can supply their own
 * implementation through `AwsComprehendRedactorOptions.client`.
 */
interface ComprehendClientLike {
send(command: DetectPiiEntitiesCommand): Promise<{ Entities?: PiiEntity[] }>;
}

/**
 * A chat message as far as redaction is concerned: a string `content` plus
 * any number of additional properties, which are typed as `unknown`.
 */
interface MessageLike {
// The text that `redactMessages` passes through `redactText`.
content: string;
// Any other properties a message may carry (typed as `unknown`).
[key: string]: unknown;
}

/**
 * Construction options for `AwsComprehendRedactor`. Every field is optional.
 */
export interface AwsComprehendRedactorOptions {
// Client to send detection commands with; when omitted the redactor builds a `ComprehendClient`.
client?: ComprehendClientLike;
// Region for the internally built client; the constructor falls back to the
// AWS_REGION and then AWS_DEFAULT_REGION environment variables.
region?: string;
// Language code sent with each detection request; the constructor defaults to `LanguageCode.EN`.
languageCode?: LanguageCode;
// Entities whose `Score` is below this value are left unredacted; the constructor defaults to 0.
minScore?: number;
// When provided, only entities whose `Type` appears in this list are redacted.
entityTypes?: string[];
// Replacement for each redacted span: a fixed string, or a function that derives
// it from the detected entity. When omitted, `[REDACTED_<Type>]` is used.
mask?: string | ((entity: PiiEntity) => string);
}

/**
 * Shape accepted by `AwsComprehendRedactor.redactChatInput`: an optional
 * `prompt`, an optional `messages` list, and any other properties, which are
 * typed as `unknown`.
 */
export interface ChatInputWithPrompt {
// Free-form prompt text; redacted when present.
prompt?: string;
// Chat messages; each message's `content` is redacted when the list is present.
messages?: MessageLike[];
// Any additional request fields (typed as `unknown`).
[key: string]: unknown;
}

/**
 * Replaces PII detected by a Comprehend-style client with mask text.
 *
 * Every non-empty input is sent to the client in a `DetectPiiEntitiesCommand`;
 * the returned entities are filtered by score and (optionally) by type, and
 * the character ranges they cover are replaced with the configured mask.
 */
export class AwsComprehendRedactor {
  private readonly client: ComprehendClientLike;
  private readonly languageCode: LanguageCode;
  private readonly minScore: number;
  private readonly entityTypes?: Set<string>;
  private readonly mask: string | ((entity: PiiEntity) => string);

  /**
   * @param options - Optional configuration. When `client` is not supplied a
   *   `ComprehendClient` is created using `region`, then `AWS_REGION`, then
   *   `AWS_DEFAULT_REGION`.
   */
  constructor(options: AwsComprehendRedactorOptions = {}) {
    this.client =
      options.client ||
      new ComprehendClient({
        region: options.region || process.env.AWS_REGION || process.env.AWS_DEFAULT_REGION,
      });
    this.languageCode = options.languageCode || LanguageCode.EN;
    this.minScore = options.minScore ?? 0;
    this.entityTypes = options.entityTypes ? new Set(options.entityTypes) : undefined;
    // `??` rather than `||`: an empty-string mask is a legitimate request to
    // strip the detected text entirely and must not fall back to the default.
    this.mask = options.mask ?? ((entity) => `[REDACTED_${entity.Type || "PII"}]`);
  }

  /**
   * Redacts the PII found in a single string.
   *
   * @param text - Text to scan. Falsy values (such as `""`) are returned
   *   unchanged without contacting the client.
   * @returns The text with every selected entity range replaced by the mask.
   * @throws Whatever the client's `send` rejects with.
   */
  async redactText(text: string): Promise<string> {
    if (!text) {
      return text;
    }

    const response = await this.client.send(
      new DetectPiiEntitiesCommand({
        Text: text,
        LanguageCode: this.languageCode,
      })
    );

    const selected = (response.Entities ?? [])
      .filter(
        (entity) => typeof entity.BeginOffset === "number" && typeof entity.EndOffset === "number"
      )
      // Entities without a score are treated as fully confident.
      .filter((entity) => (entity.Score ?? 1) >= this.minScore)
      .filter((entity) => !this.entityTypes || this.entityTypes.has(entity.Type || ""))
      .sort((a, b) => (a.BeginOffset ?? 0) - (b.BeginOffset ?? 0));

    // Merge overlapping ranges first. Splicing overlapping ranges one by one
    // would apply offsets to already-modified text and could leave fragments
    // of the sensitive value (or of a previous mask) in the output.
    const spans: Array<{ begin: number; end: number; entity: PiiEntity }> = [];
    for (const entity of selected) {
      const begin = entity.BeginOffset ?? 0;
      const end = Math.max(entity.EndOffset ?? begin, begin);
      const last = spans[spans.length - 1];
      if (last !== undefined && begin < last.end) {
        // Overlap: widen the earlier span; its entity decides the mask text.
        last.end = Math.max(last.end, end);
      } else {
        spans.push({ begin, end, entity });
      }
    }

    // NOTE(review): offsets are applied as JavaScript string indexes (UTF-16
    // code units) — confirm this matches the unit the service reports for
    // text containing characters outside the Basic Multilingual Plane.
    let redacted = "";
    let cursor = 0;
    for (const span of spans) {
      redacted += text.slice(cursor, span.begin) + this.maskFor(span.entity);
      cursor = span.end;
    }
    return redacted + text.slice(cursor);
  }

  /**
   * Redacts the `content` of every message; messages are processed concurrently.
   *
   * @param messages - Messages to redact. The input objects are not mutated.
   * @returns Shallow copies of the messages, in the same order, with redacted `content`.
   */
  async redactMessages<T extends MessageLike>(messages: T[]): Promise<T[]> {
    return await Promise.all(
      messages.map(async (message) => ({
        ...message,
        content: await this.redactText(message.content),
      }))
    );
  }

  /**
   * Redacts the `prompt` and `messages` of a chat input, leaving every other
   * property as is.
   *
   * @param input - Chat input to redact. The input object is not mutated.
   * @returns A shallow copy of the input. `prompt` and `messages` appear on the
   *   copy only when they were defined on the input.
   */
  async redactChatInput<T extends ChatInputWithPrompt>(input: T): Promise<T> {
    // Collect only the fields that exist so the copy does not gain
    // `prompt: undefined` / `messages: undefined` keys the caller never set.
    const overrides: Partial<ChatInputWithPrompt> = {};
    if (input.prompt !== undefined) {
      overrides.prompt = await this.redactText(input.prompt);
    }
    if (input.messages !== undefined) {
      overrides.messages = await this.redactMessages(input.messages);
    }
    return { ...input, ...overrides };
  }

  /** Resolves the replacement text for one detected entity. */
  private maskFor(entity: PiiEntity): string {
    return typeof this.mask === "function" ? this.mask(entity) : this.mask;
  }
}
Loading
Loading