Redact: multi-doc upload, contextual person naming, aliases
- Extract limit raised from 32K to 128K chars per file (long legal docs now fit)
- Redact API body/text limits raised (400KB / 128K chars) to match
- Upload zone accepts multiple files (up to 5); extracted text is concatenated with a document separator and combined before redaction; shows per-file char counts
- LLM redact pass now infers contextual person roles (FATHER, MOTHER, CHILD, ATTORNEY, JUDGE, etc.) instead of generic [PERSON] for all names; the same individual gets a consistent tag throughout the document
- Tag validation widened to allow any [A-Za-z0-9_- ] pattern (not just the five hardcoded tags), supporting contextual and alias tags
- Alias UI added to Redact mode: user maps real names to bracketed aliases (e.g. "David Jr" -> [Junior]); aliases injected into LLM system prompt as override instructions; max 20 aliases, 100 chars each
- max_tokens raised from 2000 to 4000; timeout from 60s to 90s for larger docs

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
This commit is contained in:
+89
-26
@@ -84,8 +84,11 @@ document.addEventListener('DOMContentLoaded', () => {
|
||||
uploadInput: document.querySelector('#uploadInput'),
|
||||
uploadPrompt: document.querySelector('#uploadPrompt'),
|
||||
uploadFileInfo: document.querySelector('#uploadFileInfo'),
|
||||
uploadFileName: document.querySelector('#uploadFileName'),
|
||||
uploadFileList: document.querySelector('#uploadFileList'),
|
||||
uploadClear: document.querySelector('#uploadClear'),
|
||||
aliasSection: document.querySelector('#aliasSection'),
|
||||
addAliasRow: document.querySelector('#addAliasRow'),
|
||||
aliasRows: document.querySelector('#aliasRows'),
|
||||
});
|
||||
|
||||
els.tabs.forEach((button) => {
|
||||
@@ -95,6 +98,7 @@ document.addEventListener('DOMContentLoaded', () => {
|
||||
els.passcodeForm.addEventListener('submit', submitPasscode);
|
||||
els.healthButton.addEventListener('click', checkHealth);
|
||||
setupUpload();
|
||||
setupAliases();
|
||||
setTool(state.activeTool);
|
||||
|
||||
if (state.authenticated) {
|
||||
@@ -122,7 +126,9 @@ function setTool(toolName) {
|
||||
els.languageControl.classList.toggle('is-hidden', !tool.usesLanguage);
|
||||
els.redactionControl.classList.toggle('is-hidden', toolName !== 'redact');
|
||||
els.uploadZone.classList.toggle('is-hidden', toolName !== 'redact');
|
||||
els.aliasSection.classList.toggle('is-hidden', toolName !== 'redact');
|
||||
resetUpload();
|
||||
resetAliases();
|
||||
els.status.textContent = '';
|
||||
renderTrace([]);
|
||||
}
|
||||
@@ -170,6 +176,7 @@ async function runTool(event) {
|
||||
if (state.activeTool === 'redact') {
|
||||
payload.mode = currentRedactionMode();
|
||||
payload.region = currentRedactionRegion();
|
||||
payload.aliases = getAliases();
|
||||
}
|
||||
|
||||
setBusy(true);
|
||||
@@ -200,7 +207,7 @@ function resetUpload() {
|
||||
els.uploadInput.value = '';
|
||||
els.uploadPrompt.classList.remove('is-hidden');
|
||||
els.uploadFileInfo.classList.add('is-hidden');
|
||||
els.uploadFileName.textContent = '';
|
||||
els.uploadFileList.innerHTML = '';
|
||||
els.uploadZone.classList.remove('is-drag-over');
|
||||
}
|
||||
|
||||
@@ -219,8 +226,7 @@ function setupUpload() {
|
||||
els.uploadZone.addEventListener('drop', (e) => {
|
||||
e.preventDefault();
|
||||
els.uploadZone.classList.remove('is-drag-over');
|
||||
const file = e.dataTransfer?.files?.[0];
|
||||
if (file) handleFileUpload(file);
|
||||
if (e.dataTransfer?.files?.length) handleFiles(e.dataTransfer.files);
|
||||
});
|
||||
|
||||
els.uploadZone.addEventListener('click', (e) => {
|
||||
@@ -230,49 +236,74 @@ function setupUpload() {
|
||||
});
|
||||
|
||||
els.uploadInput.addEventListener('change', () => {
|
||||
const file = els.uploadInput.files?.[0];
|
||||
if (file) handleFileUpload(file);
|
||||
if (els.uploadInput.files?.length) handleFiles(els.uploadInput.files);
|
||||
});
|
||||
|
||||
els.uploadClear.addEventListener('click', () => {
|
||||
resetUpload();
|
||||
els.input.value = '';
|
||||
els.status.textContent = '';
|
||||
});
|
||||
}
|
||||
|
||||
async function handleFileUpload(file) {
|
||||
async function handleFiles(fileList) {
|
||||
const allowed = ['pdf', 'docx', 'txt'];
|
||||
const ext = file.name.split('.').pop().toLowerCase();
|
||||
if (!allowed.includes(ext)) {
|
||||
els.status.textContent = 'Unsupported file type. Use .pdf, .docx, or .txt.';
|
||||
return;
|
||||
const files = Array.from(fileList).slice(0, 5);
|
||||
|
||||
for (const file of files) {
|
||||
const ext = file.name.split('.').pop().toLowerCase();
|
||||
if (!allowed.includes(ext)) {
|
||||
els.status.textContent = `Skipped ${file.name}: unsupported type. Use .pdf, .docx, or .txt.`;
|
||||
return;
|
||||
}
|
||||
}
|
||||
|
||||
els.status.textContent = `Extracting ${file.name}…`;
|
||||
els.status.textContent = files.length === 1 ? `Extracting ${files[0].name}…` : `Extracting ${files.length} files…`;
|
||||
setBusy(true);
|
||||
|
||||
const parts = [];
|
||||
let totalChars = 0;
|
||||
let anyTruncated = false;
|
||||
|
||||
try {
|
||||
const formData = new FormData();
|
||||
formData.append('file', file);
|
||||
for (const file of files) {
|
||||
const formData = new FormData();
|
||||
formData.append('file', file);
|
||||
|
||||
const resp = await fetch('api/extract.php', {
|
||||
method: 'POST',
|
||||
credentials: 'same-origin',
|
||||
body: formData,
|
||||
});
|
||||
const data = await resp.json().catch(() => ({}));
|
||||
const resp = await fetch('api/extract.php', {
|
||||
method: 'POST',
|
||||
credentials: 'same-origin',
|
||||
body: formData,
|
||||
});
|
||||
const data = await resp.json().catch(() => ({}));
|
||||
|
||||
if (!resp.ok || !data.ok) {
|
||||
throw new Error(data.error?.message || `Extraction failed (HTTP ${resp.status}).`);
|
||||
if (!resp.ok || !data.ok) {
|
||||
throw new Error(data.error?.message || `Extraction failed for ${file.name} (HTTP ${resp.status}).`);
|
||||
}
|
||||
|
||||
parts.push({ filename: file.name, chars: data.chars, truncated: data.truncated, text: data.text });
|
||||
totalChars += data.chars;
|
||||
if (data.truncated) anyTruncated = true;
|
||||
}
|
||||
|
||||
els.input.value = data.text;
|
||||
els.uploadFileName.textContent = file.name;
|
||||
const combined = parts.length === 1
|
||||
? parts[0].text
|
||||
: parts.map((p) => `--- Document: ${p.filename} ---\n\n${p.text}`).join('\n\n');
|
||||
|
||||
const MAX_COMBINED = 128000;
|
||||
const combinedTruncated = combined.length > MAX_COMBINED;
|
||||
els.input.value = combinedTruncated ? combined.slice(0, MAX_COMBINED) : combined;
|
||||
|
||||
els.uploadFileList.innerHTML = parts
|
||||
.map((p) => `<li><span class="upload-filename">${escapeHtml(p.filename)}</span><span class="upload-chars">${p.chars.toLocaleString()} chars${p.truncated ? ' • per-file limit reached' : ''}</span></li>`)
|
||||
.join('');
|
||||
els.uploadPrompt.classList.add('is-hidden');
|
||||
els.uploadFileInfo.classList.remove('is-hidden');
|
||||
|
||||
const note = data.truncated ? ' (truncated to 32 000 chars)' : '';
|
||||
els.status.textContent = `Extracted ${data.chars.toLocaleString()} chars from ${file.name}${note}.`;
|
||||
const truncNote = (anyTruncated || combinedTruncated) ? ' — truncated to 128 000 char limit' : '';
|
||||
els.status.textContent = parts.length === 1
|
||||
? `Extracted ${totalChars.toLocaleString()} chars from ${parts[0].filename}${truncNote}.`
|
||||
: `Extracted ${totalChars.toLocaleString()} chars total from ${parts.length} files${truncNote}.`;
|
||||
} catch (err) {
|
||||
els.status.textContent = err.message;
|
||||
resetUpload();
|
||||
@@ -281,6 +312,38 @@ async function handleFileUpload(file) {
|
||||
}
|
||||
}
|
||||
|
||||
/**
 * Wires up the alias editor: the "add row" button appends a new
 * real-name -> alias input pair, and a delegated click handler on the row
 * container removes a row when its remove button is pressed.
 *
 * Rows are capped at 20 to match the documented alias limit.
 * NOTE(review): the limit is presumably also enforced server-side — confirm.
 */
function setupAliases() {
  const MAX_ALIAS_ROWS = 20;

  // Static markup only; no user-supplied data is interpolated here.
  const rowMarkup = [
    '<input type="text" class="alias-original" placeholder="Real name" maxlength="100">',
    '<span class="alias-arrow" aria-hidden="true">→</span>',
    '<input type="text" class="alias-label" placeholder="Alias (without brackets)" maxlength="100">',
    '<button type="button" class="alias-remove" aria-label="Remove alias">×</button>',
  ].join('');

  els.addAliasRow.addEventListener('click', () => {
    // Refuse to grow past the limit instead of letting the user fill in
    // rows that exceed the documented maximum.
    const rowCount = els.aliasRows.querySelectorAll('.alias-row').length;
    if (rowCount >= MAX_ALIAS_ROWS) {
      els.status.textContent = `You can add up to ${MAX_ALIAS_ROWS} aliases.`;
      return;
    }

    const row = document.createElement('div');
    row.className = 'alias-row';
    row.innerHTML = rowMarkup;
    els.aliasRows.appendChild(row);

    // Put the cursor in the first field of the freshly added row.
    row.querySelector('.alias-original').focus();
  });

  // Delegated handler: one listener on the container covers every row's
  // remove button, including rows added later.
  els.aliasRows.addEventListener('click', (e) => {
    const btn = e.target.closest('.alias-remove');
    if (btn) btn.closest('.alias-row').remove();
  });
}
|
||||
|
||||
/**
 * Collects the alias mappings currently entered in the alias editor.
 *
 * Both fields of a row are trimmed; a row is included only when both the
 * real name and the alias are non-empty after trimming.
 *
 * @returns {{original: string, alias: string}[]} One entry per completed row,
 *   in document order.
 */
function getAliases() {
  const pairs = [];

  for (const rowEl of els.aliasRows.querySelectorAll('.alias-row')) {
    // A missing input is treated the same as an empty one.
    const original = rowEl.querySelector('.alias-original')?.value.trim() ?? '';
    const alias = rowEl.querySelector('.alias-label')?.value.trim() ?? '';

    if (original && alias) {
      pairs.push({ original, alias });
    }
  }

  return pairs;
}
|
||||
|
||||
/**
 * Removes every row from the alias editor.
 * Does nothing when the alias row container was not found on the page.
 */
function resetAliases() {
  const container = els.aliasRows;
  if (!container) {
    return;
  }
  container.innerHTML = '';
}
|
||||
|
||||
async function checkHealth() {
|
||||
els.healthPill.textContent = 'Checking...';
|
||||
try {
|
||||
|
||||
Reference in New Issue
Block a user