a0bf6c15f4
Resolves #52 This Pull Request introduces the **NexusSearchBox** search feature with premium unified styling, implements a robust **dynamic Qdrant collection auto-provisioning and batch-vector ingestion pipeline**, integrates a unified **Serilog logging infrastructure** for the Blazor Hybrid environment (MAUI), and resolves the **401 Unauthorized API header propagation error** inside mobile builds. ### 🚀 Key Implementations #### 1. Premium `NexusSearchBox` & Semantic Search UI * **NexusSearchBox Component:** Created an elegant search-as-you-type search box with smooth key navigation, quick-clearing, and seamless dynamic styling. * **Unified Aesthetics:** Refactored the search box isolated styling to align perfectly with the dashboard's design system using glassmorphism, `--nexus-neon` token gradients, and smooth pulse/fade animations. * **Semantic Search Integration:** Integrated semantic search query dispatching (`SearchLibrarySemanticallyQuery`) and wired up navigation seamlessly through the updated `ReaderNavigationService`. * **Tests Hardening:** Added/adapted query assertions in `QueryTests.cs` to guarantee safe parameterization and error boundary mapping. #### 2. Qdrant Collection Provisioning & Vector Ingestion * **Dynamic Auto-Provisioning:** Implemented dynamic checking and lazy-creation of the `knowledge_units` collection using 768 dimensions and Cosine distance. * **High-Performance Ingestion:** Optimized `ProcessKnowledgeUnitsAsync` with high-performance batch embedding generation using `_embeddingGenerator` and deterministic MD5 GUIDs for stable, duplicate-free upsertion. * **Database Cache Clear Sync:** Integrated Qdrant collection deletion in `ClearCacheAsync` to ensure absolute consistency between the PostgreSQL database cache and vector database indices. #### 3. 
Cross-Platform MAUI Logging (Serilog Infrastructure) * **Serilog Integration:** Configured cross-platform Serilog routing in `SerilogConfiguration.cs`, streaming diagnostic logs safely across native platforms and the Blazor Webview container. * **Interop Bridge:** Built `BlazorLoggingBridge.cs` to capture web console messages and pipe them directly to the native host logger. * **Demo Interface:** Added an interactive `SerilogDemo.razor` sandbox under Pages. #### 4. Resolving 401 Load Errors (Authentication Handler Flow) * **Authentication Header Handler:** Implemented the `MobileAuthenticationHeaderHandler` to correctly extract, validate, and inject bearer JWT tokens into outbound API requests. * **Configuration-based API Host:** Structured standard API URI routing to use clean configuration bindings in `appsettings.json`. --- ### 🧪 Verification & Build Status * Run `dotnet build` from the solution root: Successfully compiled the full multi-targeted solution (`Liczba błędów: 0`). * All unit and integration tests successfully executed and verified (`dotnet test`). --------- Co-authored-by: Marek Jasiński <jasins.marek@gmail.com> Co-authored-by: Marek Jaisński <jasins.marek@gmail.com> Reviewed-on: #51 Co-authored-by: Antigravity <antigravity@google.com> Co-committed-by: Antigravity <antigravity@google.com>
86 lines
3.1 KiB
C#
86 lines
3.1 KiB
C#
using System.Text.RegularExpressions;
|
|
using FluentResults;
|
|
using Microsoft.Extensions.Logging;
|
|
using NexusReader.Application.Abstractions.Services;
|
|
using VersOne.Epub;
|
|
|
|
namespace NexusReader.Infrastructure.Services;
|
|
|
|
/// <summary>
/// Reads an EPUB file located under a <c>wwwroot</c> directory and returns the plain text
/// of each item in its reading order, with HTML markup removed.
/// </summary>
public class EpubExtractor : IEpubExtractor
{
    // Matches <style>/<script> elements together with their content so CSS/JS never leaks into
    // the extracted text. CultureInvariant keeps the case-insensitive match independent of the
    // current thread culture (e.g. Turkish dotted/dotless 'i').
    private static readonly Regex StyleAndScriptBlocks = new(
        @"<(style|script)\b[^>]*>.*?</\1>",
        RegexOptions.IgnoreCase | RegexOptions.Singleline | RegexOptions.CultureInvariant | RegexOptions.Compiled);

    // Matches any remaining markup tag.
    private static readonly Regex AnyTag = new(@"<[^>]*>", RegexOptions.Compiled);

    // Matches runs of whitespace so they can be collapsed to a single space.
    private static readonly Regex WhitespaceRun = new(@"\s+", RegexOptions.Compiled);

    private readonly ILogger<EpubExtractor> _logger;

    /// <summary>
    /// Creates the extractor.
    /// </summary>
    /// <param name="logger">Logger used to report missing files, cancellation and extraction errors.</param>
    public EpubExtractor(ILogger<EpubExtractor> logger)
    {
        _logger = logger;
    }

    /// <summary>
    /// Opens the EPUB identified by <paramref name="relativePath"/> and extracts the cleaned text
    /// of every item in its reading order.
    /// </summary>
    /// <param name="relativePath">Path of the EPUB relative to a <c>wwwroot</c> directory; <c>/</c> separators are accepted.</param>
    /// <param name="cancellationToken">Checked before each chapter is read.</param>
    /// <returns>
    /// A successful result holding one string per reading-order item, or a failed result when the
    /// file cannot be found, the book has no reading order, the operation is cancelled, or any
    /// exception is raised while reading. This method does not throw.
    /// </returns>
    public async Task<Result<List<string>>> ExtractChaptersTextAsync(string relativePath, CancellationToken cancellationToken = default)
    {
        try
        {
            // ResolvePath only ever returns a path that existed at probe time, so null means "not found".
            var fullPath = ResolvePath(relativePath);
            if (fullPath is null)
            {
                _logger.LogError("[EpubExtractor] EPUB file not found at path: {FilePath}", relativePath);
                return Result.Fail<List<string>>($"Plik EPUB nie został znaleziony na dysku: {relativePath}");
            }

            using var bookRef = await EpubReader.OpenBookAsync(fullPath);
            var readingOrder = bookRef.GetReadingOrder();

            if (readingOrder == null || !readingOrder.Any())
            {
                return Result.Fail<List<string>>("EPUB nie zawiera czytelnych rozdziałów.");
            }

            var chapters = new List<string>();
            foreach (var chapterRef in readingOrder)
            {
                // A cancelled run must not be reported as success: the list would be silently
                // incomplete and callers could not tell it apart from a full extraction.
                if (cancellationToken.IsCancellationRequested)
                {
                    _logger.LogWarning("[EpubExtractor] Extraction cancelled for EPUB: {FilePath}", relativePath);
                    return Result.Fail<List<string>>("EPUB extraction was cancelled.");
                }

                var rawContent = await chapterRef.ReadContentAsTextAsync();
                chapters.Add(StripHtml(rawContent));
            }

            return Result.Ok(chapters);
        }
        catch (Exception ex)
        {
            _logger.LogError(ex, "[EpubExtractor] Error extracting chapters from EPUB: {FilePath}", relativePath);
            return Result.Fail<List<string>>(new Error("Failed to parse and extract text from EPUB").CausedBy(ex));
        }
    }

    /// <summary>
    /// Locates <paramref name="relativePath"/> on disk by walking from the application base
    /// directory up to the filesystem root and probing, at each level, <c>wwwroot/</c> and
    /// <c>src/NexusReader.Web/wwwroot/</c>.
    /// </summary>
    /// <param name="relativePath">Path relative to <c>wwwroot</c>; leading separators are ignored.</param>
    /// <returns>The first existing candidate path, or <c>null</c> when the input is blank or nothing matches.</returns>
    private static string? ResolvePath(string relativePath)
    {
        if (string.IsNullOrWhiteSpace(relativePath))
        {
            return null;
        }

        // Leading separators are trimmed because Path.Combine discards every preceding segment
        // when a later argument is rooted; "/books/a.epub" would otherwise bypass wwwroot entirely.
        // NOTE(review): ".." segments are not rejected here — confirm callers only pass trusted paths.
        var normalized = relativePath
            .Replace('/', Path.DirectorySeparatorChar)
            .TrimStart(Path.DirectorySeparatorChar);

        if (normalized.Length == 0)
        {
            return null;
        }

        var currentDir = new DirectoryInfo(AppDomain.CurrentDomain.BaseDirectory);
        while (currentDir != null)
        {
            var candidate = Path.Combine(currentDir.FullName, "wwwroot", normalized);
            if (File.Exists(candidate))
            {
                return candidate;
            }

            var devCandidate = Path.Combine(currentDir.FullName, "src", "NexusReader.Web", "wwwroot", normalized);
            if (File.Exists(devCandidate))
            {
                return devCandidate;
            }

            currentDir = currentDir.Parent;
        }

        return null;
    }

    /// <summary>
    /// Converts an HTML/XHTML fragment to plain text: drops style/script elements, replaces the
    /// remaining tags with spaces, decodes HTML entities and collapses whitespace.
    /// </summary>
    /// <param name="html">Markup to clean; null or empty yields an empty string.</param>
    /// <returns>The trimmed plain text.</returns>
    private static string StripHtml(string html)
    {
        if (string.IsNullOrEmpty(html))
        {
            return string.Empty;
        }

        var clean = StyleAndScriptBlocks.Replace(html, "");

        // Tags become spaces (not empty strings) so adjacent block elements do not glue words together.
        clean = AnyTag.Replace(clean, " ");

        // Entities are decoded only after tag removal so escaped text such as "&lt;b&gt;" survives as literal text.
        clean = System.Net.WebUtility.HtmlDecode(clean);

        return WhitespaceRun.Replace(clean, " ").Trim();
    }
}
|