Real channel fetch (Telegram/Bale/Divar) + AI-audited automation engine + CI/CD

- Fetch: Telegram via t.me/s, Bale via Bot API, Divar via web-search (HttpClient, config-gated, graceful) - AI layer: DB-backed AppSetting (mode auto/manual, thresholds, AI endpoint/model/key/prompt/framework, auto-approve); OpenAI-compatible IAiAuditor (self-host/Iranian endpoints; fails safe to manual) - Pipeline: fetch → dedupe(hash) → parse → validate → AI audit → Discard/Flag/Queue/auto-publish (resolve-or-create facility) - Admin: /Admin/Settings automation+AI panel; queue shows confidence + AI verdict; flagged section - CI/CD: Dockerfile, docker-compose.prod.yml, .gitea/workflows/ci-cd.yml, nginx vhost, DEPLOY.md; forwarded headers + /healthz + prod reference-only seed; ports 22/80/443 only Co-Authored-By: Claude Opus 4.8 <noreply@anthropic.com>
2026-06-03 17:41:02 +03:30
parent 931b7b6ffb
commit 36bb165438
18 changed files with 1614 additions and 68 deletions
@@ -0,0 +1,50 @@
+using System.ComponentModel.DataAnnotations;
+
+namespace JobsMedical.Web.Models;
+
+/// <summary>
+/// Single-row (Id=1) platform settings the admin controls at runtime — chiefly the ingestion
+/// automation policy and the optional AI audit layer. Kept in the DB (not appsettings) so it's
+/// editable from the admin panel without a redeploy.
+/// </summary>
+public class AppSetting
+{
+    public int Id { get; set; } = 1;
+
+    // --- Ingestion automation ---
+    public IngestionMode Mode { get; set; } = IngestionMode.Manual;
+
+    /// <summary>In Automatic mode WITHOUT AI, listings at/above this confidence auto-publish.</summary>
+    public int AutoPublishMinConfidence { get; set; } = 85;
+
+    // --- AI audit layer (optional) ---
+    public bool AiEnabled { get; set; } = false;
+
+    /// <summary>OpenAI-compatible chat-completions endpoint (self-hosted or Iranian provider).</summary>
+    [MaxLength(500)] public string? AiEndpoint { get; set; }
+    [MaxLength(200)] public string? AiApiKey { get; set; }
+    [MaxLength(120)] public string? AiModel { get; set; } = "gpt-4o-mini";
+
+    /// <summary>The prompt + "framework" the AI follows to approve / reject / structure a listing.</summary>
+    [MaxLength(4000)]
+    public string AiSystemPrompt { get; set; } = DefaultPrompt;
+
+    /// <summary>If AI approves AND Mode is Automatic, publish without human review.</summary>
+    public bool AiAutoApprove { get; set; } = false;
+
+    public DateTime UpdatedAt { get; set; } = DateTime.UtcNow;
+
+    public const string DefaultPrompt = """
+        تو دستیار بررسی آگهی‌های کاری حوزه درمان برای پلتفرم «همکادر» هستی.
+        هر آگهی خام را بخوان و تصمیم بگیر:
+        - approve: آگهی واقعی و مرتبط با شیفت/استخدام کادر درمان است و اطلاعات کافی دارد.
+        - reject: تبلیغ، اسپم، نامرتبط، یا فاقد اطلاعات حداقلی است.
+        - review: مرتبط است اما ناقص/مبهم و نیاز به بررسی انسانی دارد.
+        نقش، شهر/محله، نوع شیفت، نوع همکاری، مبلغ یا درصد سهم، و عنوان را در صورت وجود استخراج کن.
+        فقط با یک شیء JSON پاسخ بده با کلیدهای:
+        decision (approve|reject|review)، confidence (0-100)، reason (فارسی کوتاه)،
+        kind (shift|job)، role، city، district، shiftType (day|evening|night|oncall)،
+        employmentType (fulltime|parttime|contract|plan)، payAmount (عدد تومان یا null)،
+        sharePercent (0-100 یا null)، title، facilityName.
+        """;
+}
@@ -75,3 +75,10 @@ public enum ListingKind
    Shift = 0,
    Job = 1
 }
+
+/// <summary>How ingested listings get onto the site.</summary>
+public enum IngestionMode
+{
+    Manual = 0,      // همه‌چیز به صف بررسی می‌رود؛ ادمین تأیید می‌کند
+    Automatic = 1    // موارد تأییدشده (طبق آستانه/هوش مصنوعی) خودکار منتشر می‌شوند
+}