188 lines
7.3 KiB
PHP
188 lines
7.3 KiB
PHP
<?php
|
|
declare(strict_types=1);
|
|
|
|
require_once __DIR__ . '/../includes/bootstrap.php';
|
|
require_once __DIR__ . '/../includes/DiscrepancyAgent.php';
|
|
require_once __DIR__ . '/../includes/CaseResults.php';
|
|
require_once __DIR__ . '/../includes/ToolModels.php';
|
|
|
|
// ---------------------------------------------------------------------------
// Request gating.
// The helpers below come from the project bootstrap; presumably each one ends
// the request itself when its check fails — confirm against bootstrap.php.
// NOTE(review): the free-tier deduction runs before the payload and uploads
// are validated, so a request that later fails validation has presumably
// already been charged — confirm this is intended.
// ---------------------------------------------------------------------------
dbnToolsRequireMethod('POST');
dbnToolsRequireAuth();
$ftUid = dbnToolsFreeTierCheck('discrepancy');
$ftRemaining = dbnToolsFreeTierDeduct($ftUid, 'discrepancy');

// ---------------------------------------------------------------------------
// Streaming setup: switch off every buffering layer reachable from here so
// each NDJSON line is sent to the client as soon as it is echoed.
// ---------------------------------------------------------------------------
@ini_set('output_buffering', '0');
@ini_set('zlib.output_compression', '0');
@ini_set('implicit_flush', '1');

// Discard any output buffers that are already open. Stop as soon as
// ob_end_clean() reports failure: a buffer that cannot be removed leaves
// ob_get_level() unchanged, so an unconditional loop would never terminate.
while (ob_get_level() > 0) {
    if (!@ob_end_clean()) {
        break;
    }
}
ob_implicit_flush(true);

// Response headers for a newline-delimited JSON stream.
header('Content-Type: application/x-ndjson; charset=utf-8');
header('Cache-Control: no-store');
// Asks a buffering reverse proxy (nginx honours this header) to pass data through unbuffered.
header('X-Accel-Buffering: no');
// Only advertise the balance when the deduct call returned a non-negative value.
if ($ftRemaining >= 0) {
    header('X-Credits-Remaining: ' . $ftRemaining);
}

// Default language; replaced once the payload has been parsed. It is defined
// here so the error handlers can log it even when parsing fails.
$language = 'en';
// Reference point for every t_ms / latency_ms value reported by this script.
$startTime = microtime(true);
|
|
|
|
/**
 * Write one NDJSON event line to the response and flush it immediately.
 *
 * The event name is stored under 'event' and the milliseconds elapsed since
 * $startTime under 't_ms'; both overwrite same-named keys in $payload.
 *
 * @param string $event   Event name, e.g. 'progress', 'start', 'final', 'error'.
 * @param array  $payload Extra fields to send with the event.
 */
$emit = function (string $event, array $payload = []) use ($startTime): void {
    $payload['event'] = $event;
    $payload['t_ms'] = (int)round((microtime(true) - $startTime) * 1000);

    $flags = JSON_UNESCAPED_UNICODE | JSON_UNESCAPED_SLASHES;
    $line = json_encode($payload, $flags);

    if ($line === false) {
        // json_encode() returns false when the payload contains something it
        // cannot represent (most commonly invalid UTF-8 in a string). Retry
        // leniently so the event still reaches the client: malformed bytes are
        // replaced with U+FFFD and any other unencodable value is substituted.
        $line = json_encode(
            $payload,
            $flags | JSON_INVALID_UTF8_SUBSTITUTE | JSON_PARTIAL_OUTPUT_ON_ERROR
        );
    }

    if ($line === false) {
        // Never write a blank line into the NDJSON stream; record the failure instead.
        error_log('DBN discrepancy emit failed for event "' . $event . '": ' . json_last_error_msg());
        return;
    }

    echo $line . "\n";
    @flush();
};
|
|
|
|
// Main request pipeline: parse the payload, extract both uploaded documents,
// run the discrepancy agent, log metadata, persist the result and stream the
// outcome as NDJSON events. Any failure is reported as a single 'error' event.
try {
    // Parse payload (always multipart — two files required)
    $payloadRaw = (string)($_POST['payload'] ?? '');
    if ($payloadRaw === '') {
        throw new DbnToolsHttpException('Missing payload field.', 422, 'missing_payload');
    }
    $input = json_decode($payloadRaw, true);
    if (!is_array($input)) {
        throw new DbnToolsHttpException('Invalid payload JSON.', 422, 'invalid_payload_json');
    }

    $language = dbnToolsNormalizeLanguage($input['language'] ?? 'en');
    $engine = ToolModels::engineForUser($ftUid, (string)($input['engine'] ?? 'azure_mini'));
    $sliceInput = $input['slices'] ?? [];

    /**
     * Read one uploaded document, extract its text and report progress.
     *
     * @param string $field Key in $_FILES ('file_a' or 'file_b'); also used as
     *                      the suffix of the 'missing_…' error code.
     * @param string $label Human-readable document label ('A' or 'B').
     * @return array Map with the keys 'filename', 'text', 'chars', 'truncated'.
     * @throws DbnToolsHttpException When the upload is absent or failed.
     */
    $readDocument = function (string $field, string $label) use ($emit): array {
        $emit('progress', ['detail' => 'Reading Document ' . $label . '…']);

        $entry = $_FILES[$field] ?? null;
        if (!$entry || ($entry['error'] ?? UPLOAD_ERR_NO_FILE) !== UPLOAD_ERR_OK) {
            throw new DbnToolsHttpException(
                'Document ' . $label . ' is required. Upload a PDF, DOCX, or TXT file.',
                422,
                'missing_' . $field
            );
        }

        // Pass the extractor a normalised upload entry with every key present.
        $extracted = dbnToolsExtractUploadedFile([
            'name' => $entry['name'] ?? '',
            'type' => $entry['type'] ?? '',
            'tmp_name' => $entry['tmp_name'] ?? '',
            'error' => $entry['error'] ?? UPLOAD_ERR_NO_FILE,
            'size' => $entry['size'] ?? 0,
        ]);

        $document = [
            'filename' => $extracted['filename'],
            'text' => $extracted['text'],
            'chars' => $extracted['chars'],
            'truncated' => $extracted['truncated'],
        ];

        $emit('progress', ['detail' => sprintf(
            'Document %s extracted: %s (%d chars%s)',
            $label,
            $extracted['filename'],
            $extracted['chars'],
            !empty($extracted['truncated']) ? ', truncated' : ''
        )]);

        return $document;
    };

    // Extract both documents first, then reject empty extractions; this keeps
    // the order of progress events and error codes stable for clients.
    $fileA = $readDocument('file_a', 'A');
    $fileB = $readDocument('file_b', 'B');

    if (($fileA['text'] ?? '') === '') {
        throw new DbnToolsHttpException('Could not extract text from Document A.', 422, 'empty_file_a');
    }
    if (($fileB['text'] ?? '') === '') {
        throw new DbnToolsHttpException('Could not extract text from Document B.', 422, 'empty_file_b');
    }

    $emit('start', [
        'engine' => $engine,
        'language' => $language,
        'file_a' => $fileA['filename'],
        'file_b' => $fileB['filename'],
    ]);

    // Optional: append the user's case-context as supplementary background to Doc A.
    $useMyCase = !empty($input['use_my_case']);
    if ($useMyCase) {
        // The first 2000 characters of Document A serve as the retrieval query.
        $retrievalQuery = mb_substr((string)$fileA['text'], 0, 2000, 'UTF-8');
        $caseBlock = dbnToolsCaseContext(true, $retrievalQuery, 5);
        if ($caseBlock !== '') {
            $fileA['text'] .= "\n\n" . $caseBlock;
        }
    }

    // $emit is handed to the agent, presumably so it can stream its own
    // progress events — confirm against DiscrepancyAgent.php.
    $result = (new DbnDiscrepancyAgent())->run(
        $fileA,
        $fileB,
        $engine,
        $language,
        is_array($sliceInput) ? $sliceInput : [],
        $emit
    );

    $result['ok'] = true;
    $result['latency_ms'] = (int)round((microtime(true) - $startTime) * 1000);

    dbnToolsLogMetadata([
        'tool' => 'discrepancy',
        'language' => $language,
        'ok' => true,
        'latency_ms' => $result['latency_ms'],
        'source_count' => (int)($result['trace_metadata']['source_count'] ?? 0),
        'conflict_count' => (int)($result['trace_metadata']['conflict_count'] ?? 0),
        'deleted_count' => (int)($result['trace_metadata']['deleted_count'] ?? 0),
        'added_count' => (int)($result['trace_metadata']['added_count'] ?? 0),
        'deployment' => $result['trace_metadata']['deployment'] ?? null,
    ]);

    if ($ftUid > 0) {
        // Persisting the result is best-effort: the analysis has already
        // completed, so a storage failure must not replace the finished result
        // with an error. Log it and send the result without a result_id.
        try {
            $ownerId = CaseStore::caseResolveClientId($ftUid);
            $resultId = CaseResults::save($ftUid, $ownerId, 'discrepancy', $input, $result, [
                'used_case_context' => $useMyCase ? 1 : 0,
                'case_doc_ids' => dbnToolsLastCaseDocIds(),
                'model' => $result['trace_metadata']['deployment'] ?? $engine,
                'latency_ms' => $result['latency_ms'],
                'credits_charged' => FreeTier::cost('discrepancy'),
            ]);
            if ($resultId > 0) {
                $result['result_id'] = $resultId;
            }
        } catch (Throwable $saveError) {
            error_log(sprintf(
                'DBN discrepancy result save failed: %s: %s',
                get_class($saveError),
                $saveError->getMessage()
            ));
        }
    }

    $emit('final', ['result' => $result]);
} catch (DbnToolsHttpException $e) {
    // Expected, client-facing failure: report its own code, message and status.
    $latency = (int)round((microtime(true) - $startTime) * 1000);
    dbnToolsLogMetadata([
        'tool' => 'discrepancy',
        'language' => $language,
        'ok' => false,
        'latency_ms' => $latency,
        'error_code' => $e->errorCode,
    ]);
    $emit('error', ['code' => $e->errorCode, 'message' => $e->getMessage(), 'status' => $e->status]);
} catch (Throwable $e) {
    // Unexpected failure: keep the details in the server log and send the
    // client a generic message only.
    error_log(sprintf(
        'DBN discrepancy fatal: %s: %s in %s:%d',
        get_class($e),
        $e->getMessage(),
        $e->getFile(),
        $e->getLine()
    ));
    $latency = (int)round((microtime(true) - $startTime) * 1000);
    dbnToolsLogMetadata([
        'tool' => 'discrepancy',
        'language' => $language,
        'ok' => false,
        'latency_ms' => $latency,
        'error_code' => 'internal_error',
    ]);
    // 'status' is included so both error events share the same shape.
    $emit('error', [
        'code' => 'internal_error',
        'message' => 'The discrepancy finder could not complete this request.',
        'status' => 500,
    ]);
}
|