56cd87dd7b
- Remove GPU/regex engine options; keep only azure_mini (1 credit) and azure_full (2 credits)
- Variable credit cost: engine-aware pre-check and charge in api/redact.php; PricingCatalog base = 1
- Fix ATTORNEY not preserved when keepOfficials=true: add to LLM prompt, generic-tag, pseudonym regexes
- Replace Azure credits hint with per-engine credit cost text (all 4 languages)
- Single-file upload only (was: up to 5); simplify status messages
- Clear previous redaction output and show pulsing spinner when a new run starts
- Add "Save to My Docs" button in redact output panel (corpus-save.js path)
- corpus-save.js: capture source_doc_ids from button dataset, pass in POST payload
- api/save-to-corpus.php: accept source_doc_ids, store first as source_url=corpus-doc:{id}
- doc-picker.js: show "✂ Redacted" badge for documents saved from the redact tool
- CSS: .redact-working spinner, doc-item__badge--redact pill styles
Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
78 lines
2.9 KiB
PHP
78 lines
2.9 KiB
PHP
<?php
|
|
declare(strict_types=1);
|
|
|
|
require_once __DIR__ . '/../includes/LegalTools.php';
|
|
|
|
dbnToolsRequireMethod('POST');
|
|
dbnToolsRequireAuth();
|
|
|
|
// Determine engine and its credit cost before the pre-flight credit check
|
|
$input = dbnToolsJsonInput(400000);
|
|
$_validEngines = ['azure_mini', 'azure_full'];
|
|
$_engine = in_array((string)($input['engine'] ?? ''), $_validEngines, true)
|
|
? (string)$input['engine'] : 'azure_mini';
|
|
$_engineCredits = $_engine === 'azure_full' ? 2 : 1;
|
|
|
|
$ftUid = dbnToolsFreeTierCheckAmount('redact', $_engineCredits);
|
|
|
|
dbnToolsWithChargedTelemetry('redact', '', $ftUid, function () use ($input): array {
|
|
$text = dbnToolsInjectDocContent($input, dbnToolsString($input, 'text', 128000, false));
|
|
if (mb_strlen(trim($text), 'UTF-8') < 10) {
|
|
dbnToolsAbort('Paste text, upload a file, or select a document before running.', 422, 'empty_text');
|
|
}
|
|
$mode = (string)($input['mode'] ?? 'standard');
|
|
$region = dbnToolsNormalizeRegion($input['region'] ?? 'nordic');
|
|
$language = dbnToolsNormalizeLanguage($input['language'] ?? 'en');
|
|
|
|
$validEngines = ['azure_mini', 'azure_full'];
|
|
$engine = in_array((string)($input['engine'] ?? ''), $validEngines, true)
|
|
? (string)$input['engine']
|
|
: 'azure_mini';
|
|
|
|
$validFormats = ['contextual', 'generic', 'pseudonym'];
|
|
$outputFormat = in_array((string)($input['output_format'] ?? ''), $validFormats, true)
|
|
? (string)$input['output_format']
|
|
: 'contextual';
|
|
|
|
$keepOfficials = (bool)($input['keep_officials'] ?? false);
|
|
|
|
$aliases = [];
|
|
$rawAliases = $input['aliases'] ?? [];
|
|
if (is_array($rawAliases)) {
|
|
foreach (array_slice($rawAliases, 0, 20) as $item) {
|
|
if (!is_array($item)) {
|
|
continue;
|
|
}
|
|
$original = substr(trim((string)($item['original'] ?? '')), 0, 100);
|
|
$alias = substr(trim((string)($item['alias'] ?? '')), 0, 100);
|
|
if ($original !== '' && $alias !== '') {
|
|
$aliases[] = ['original' => $original, 'alias' => $alias];
|
|
}
|
|
}
|
|
}
|
|
|
|
$exemptNames = [];
|
|
$rawExempt = $input['exempt_names'] ?? [];
|
|
if (is_array($rawExempt)) {
|
|
foreach (array_slice($rawExempt, 0, 20) as $name) {
|
|
$name = substr(trim((string)$name), 0, 100);
|
|
if ($name !== '') {
|
|
$exemptNames[] = $name;
|
|
}
|
|
}
|
|
}
|
|
|
|
$rawTypes = $input['redact_types'] ?? [];
|
|
$redactTypes = [
|
|
'names' => ($rawTypes['names'] ?? true) !== false,
|
|
'orgs' => ($rawTypes['orgs'] ?? true) !== false,
|
|
'places' => ($rawTypes['places'] ?? true) !== false,
|
|
'dob' => ($rawTypes['dob'] ?? true) !== false,
|
|
];
|
|
|
|
return (new DbnLegalToolsService())->redact(
|
|
$text, $mode, $region, $language, $aliases,
|
|
$engine, $outputFormat, $keepOfficials, $exemptNames, $redactTypes
|
|
);
|
|
}, $_engineCredits);
|