Add Legal Analysis tool — two-pass DBN-legal pipeline
Restores the dbn-legal-agent-v3 fine-tune on ocelot (was silently aliased to plain qwen2.5:14b in LiteLLM since the viper retirement) and ships a new tool that uses it via a two-pass flow: Pass 1 (Azure 4o-mini) → extract up to 5 distinct legal issues Pass 2 (ocelot v3 only) → answer each issue, ≤350 tokens, with corpus Pass 3 (Azure 4o-mini) → synthesise overall assessment + next steps The 12GB-VRAM constraint motivates the split: dbn-legal-agent-v3 stays hot in VRAM through the 5 sequential per-issue calls because issue extraction and synthesis run on Azure, not on ocelot. New surface: - includes/LegalAnalysisAgent.php - api/legal-analysis.php (NDJSON streaming endpoint) - legal-analysis.php (dedicated tool page) - assets/js/legal-analysis.js (streamed UI with per-issue cards) - Save-result + case-result.php rendering for legal-analysis output - Nav registration in all four UI languages Add-on integration: a "⚖️🇳🇴 Run deep legal analysis on this text" button now appears on Summarize, Ask, and Redact result pages and streams the same pipeline inline below the existing result. Existing tools relabelled: the misleading "🇳🇴 Norwegian specialist v3 ⭐" option on advocate/deep-research/discrepancy/barnevernet is now honestly "DBN Legal Agent" — now that the real fine-tune is actually deployed, the label finally matches reality. The advocate.php v2 option was removed since the v2 GGUF is retired. Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
This commit is contained in:
@@ -0,0 +1,165 @@
|
||||
<?php
|
||||
declare(strict_types=1);
|
||||
|
||||
require_once __DIR__ . '/../includes/bootstrap.php';
|
||||
require_once __DIR__ . '/../includes/LegalAnalysisAgent.php';
|
||||
|
||||
dbnToolsRequireMethod('POST');
|
||||
dbnToolsRequireAuth();
|
||||
|
||||
@ini_set('output_buffering', '0');
|
||||
@ini_set('zlib.output_compression', '0');
|
||||
@ini_set('implicit_flush', '1');
|
||||
while (ob_get_level() > 0) { @ob_end_clean(); }
|
||||
ob_implicit_flush(true);
|
||||
|
||||
header('Content-Type: application/x-ndjson; charset=utf-8');
|
||||
header('Cache-Control: no-store');
|
||||
header('X-Accel-Buffering: no');
|
||||
|
||||
$startTime = microtime(true);
|
||||
$language = 'en';
|
||||
$creditDeducted = false;
|
||||
|
||||
$emit = function (string $event, array $payload = []) use ($startTime): void {
|
||||
$payload['event'] = $event;
|
||||
$payload['t_ms'] = (int)round((microtime(true) - $startTime) * 1000);
|
||||
echo json_encode($payload, JSON_UNESCAPED_UNICODE | JSON_UNESCAPED_SLASHES) . "\n";
|
||||
@flush();
|
||||
};
|
||||
|
||||
try {
|
||||
$input = dbnToolsJsonInput(400000);
|
||||
$language = dbnToolsNormalizeLanguage($input['language'] ?? 'en');
|
||||
$docType = (string)($input['doc_type'] ?? 'other');
|
||||
$allowedDocTypes = ['auto','barnevernet','adopsjon','emergency','samvær','fylkesnemnd','other'];
|
||||
if (!in_array($docType, $allowedDocTypes, true)) {
|
||||
$docType = 'other';
|
||||
}
|
||||
|
||||
$text = dbnToolsInjectDocContent($input, dbnToolsString($input, 'text', 128000, false));
|
||||
if (mb_strlen(trim($text), 'UTF-8') < 80) {
|
||||
throw new DbnToolsHttpException(
|
||||
'Paste at least 80 characters of text, upload a file, or select a document.',
|
||||
422, 'empty_text'
|
||||
);
|
||||
}
|
||||
|
||||
$emit('start', [
|
||||
'mode' => 'legal-analysis',
|
||||
'language' => $language,
|
||||
'doc_type' => $docType,
|
||||
'chars' => mb_strlen($text, 'UTF-8'),
|
||||
]);
|
||||
|
||||
$agent = new DbnLegalAnalysisAgent();
|
||||
|
||||
// Pass 1 — extract issues (Azure, fast); deduct credit AFTER this succeeds
|
||||
$emit('progress', ['step' => 'extracting_issues', 'detail' => 'Identifying distinct legal issues…']);
|
||||
$issues = $agent->extractIssues($text, $language, $docType);
|
||||
|
||||
if (empty($issues)) {
|
||||
$emit('final', [
|
||||
'result' => [
|
||||
'ok' => true,
|
||||
'issues' => [],
|
||||
'overall_assessment' => 'No discrete legal issues were identified in this document.',
|
||||
'next_steps' => [],
|
||||
'disclaimer' => 'Automated analysis — not legal advice.',
|
||||
'model' => 'dbn-legal-agent-v3',
|
||||
'doc_type' => $docType,
|
||||
'latency_ms' => (int)round((microtime(true) - $startTime) * 1000),
|
||||
],
|
||||
]);
|
||||
exit;
|
||||
}
|
||||
|
||||
// Deduct credit (gated until extract succeeds and at least one issue exists)
|
||||
$ftUid = dbnToolsFreeTierCheck('legal-analysis');
|
||||
$ftRemaining = dbnToolsFreeTierDeduct($ftUid, 'legal-analysis');
|
||||
$creditDeducted = true;
|
||||
if ($ftRemaining >= 0) {
|
||||
header('X-Credits-Remaining: ' . $ftRemaining);
|
||||
}
|
||||
|
||||
$emit('issues_extracted', [
|
||||
'count' => count($issues),
|
||||
'issues' => array_map(fn($i) => [
|
||||
'id' => $i['id'],
|
||||
'question' => $i['question'],
|
||||
'brief_context' => $i['brief_context'],
|
||||
'severity_hint' => $i['severity_hint'],
|
||||
], $issues),
|
||||
]);
|
||||
|
||||
// Pass 2 — answer each issue sequentially on ocelot (keeps fine-tune hot)
|
||||
$svc = new DbnLegalToolsService();
|
||||
$answered = [];
|
||||
foreach ($issues as $issue) {
|
||||
$emit('progress', [
|
||||
'step' => 'issue_searching_corpus',
|
||||
'detail' => sprintf('Issue %d: searching legal corpus…', $issue['id']),
|
||||
'issue_id' => $issue['id'],
|
||||
]);
|
||||
$corpusQuery = $issue['question'] . "\n" . $issue['brief_context'];
|
||||
$corpusContext = $svc->corpusContextForSummarize($corpusQuery, 3);
|
||||
|
||||
$emit('progress', [
|
||||
'step' => 'issue_answering',
|
||||
'detail' => sprintf('Issue %d: asking dbn-legal-agent-v3…', $issue['id']),
|
||||
'issue_id' => $issue['id'],
|
||||
]);
|
||||
$answer = $agent->answerIssue($issue, $corpusContext, $language);
|
||||
$answered[] = $answer;
|
||||
|
||||
$emit('issue_answered', ['issue' => $answer]);
|
||||
}
|
||||
|
||||
// Pass 3 — synthesise (Azure)
|
||||
$emit('progress', ['step' => 'synthesising', 'detail' => 'Synthesising overall assessment…']);
|
||||
$synth = $agent->synthesise($answered, $language, $docType);
|
||||
|
||||
$result = [
|
||||
'ok' => true,
|
||||
'issues' => $answered,
|
||||
'overall_assessment' => $synth['overall_assessment'],
|
||||
'next_steps' => $synth['next_steps'],
|
||||
'disclaimer' => $synth['disclaimer'],
|
||||
'doc_type' => $docType,
|
||||
'model' => 'dbn-legal-agent-v3',
|
||||
'latency_ms' => (int)round((microtime(true) - $startTime) * 1000),
|
||||
];
|
||||
|
||||
dbnToolsLogMetadata([
|
||||
'tool' => 'legal-analysis',
|
||||
'language' => $language,
|
||||
'ok' => true,
|
||||
'latency_ms' => $result['latency_ms'],
|
||||
'issue_count' => count($answered),
|
||||
'deployment' => 'dbn-legal-agent-v3',
|
||||
]);
|
||||
|
||||
$emit('final', ['result' => $result]);
|
||||
|
||||
} catch (DbnToolsHttpException $e) {
|
||||
$latency = (int)round((microtime(true) - $startTime) * 1000);
|
||||
dbnToolsLogMetadata([
|
||||
'tool' => 'legal-analysis',
|
||||
'language' => $language,
|
||||
'ok' => false,
|
||||
'latency_ms' => $latency,
|
||||
'error_code' => $e->errorCode,
|
||||
]);
|
||||
$emit('error', ['code' => $e->errorCode, 'message' => $e->getMessage(), 'status' => $e->status]);
|
||||
} catch (Throwable $e) {
|
||||
error_log('legal-analysis fatal: ' . $e->getMessage());
|
||||
$latency = (int)round((microtime(true) - $startTime) * 1000);
|
||||
dbnToolsLogMetadata([
|
||||
'tool' => 'legal-analysis',
|
||||
'language' => $language,
|
||||
'ok' => false,
|
||||
'latency_ms' => $latency,
|
||||
'error_code' => 'internal_error',
|
||||
]);
|
||||
$emit('error', ['code' => 'internal_error', 'message' => 'Legal analysis could not complete this request.']);
|
||||
}
|
||||
Reference in New Issue
Block a user