Compare commits
14 Commits
0457271b57
...
feature/ru
| Author | SHA1 | Date | |
|---|---|---|---|
| 135e774f71 | |||
| 45812420f5 | |||
| 883d9afa2d | |||
| 983fb5bd67 | |||
| 232036746f | |||
| 2a96a4bfaf | |||
| 4b87af80a8 | |||
| 9cb8c35616 | |||
| 3d666d5f9c | |||
| 94ca6e1b9a | |||
| 27921d625f | |||
| 358b0328e7 | |||
| 2b29e19306 | |||
| 3e6eb59251 |
5
.gitignore
vendored
@@ -220,5 +220,8 @@ local/
|
||||
*.swp
|
||||
|
||||
# Local file uploads
|
||||
src/TrueCV.Web/uploads/
|
||||
src/RealCV.Web/uploads/
|
||||
logs/
|
||||
|
||||
# Screenshots
|
||||
screenshots/
|
||||
|
||||
@@ -1,515 +0,0 @@
|
||||
# TrueCV UK APIs & Integration Resources
|
||||
|
||||
**Last Updated:** January 2026
|
||||
**Purpose:** Practical guide for obtaining API access and integration details
|
||||
|
||||
---
|
||||
|
||||
## 1. HEDD (Higher Education Degree Datacheck)
|
||||
|
||||
### Overview
|
||||
- **Service:** UK degree verification against 140+ university records
|
||||
- **Coverage:** All UK Russell Group + most other UK universities
|
||||
- **Request Type:** Real-time matching + manual university verification (10 days)
|
||||
|
||||
### Access & Integration
|
||||
|
||||
#### Contact Information
|
||||
- **Website:** https://hedd.ac.uk/
|
||||
- **For API/Integration Inquiries:**
|
||||
- Contact: partnerships@hedd.ac.uk
|
||||
- Business Development: [HEDD website contact form](https://hedd.ac.uk/)
|
||||
- Alternative: Prospects Limited (maintains HEDD)
|
||||
|
||||
#### Integration Methods
|
||||
|
||||
**Option A: REST API (Preferred - Direct)**
|
||||
- **Status:** Available for registered partners
|
||||
- **Endpoint Base:** `https://api.hedd.ac.uk/v2/`
|
||||
- **Authentication:** API Key (basic auth)
|
||||
- **Rate Limits:** Typically 500 requests/day (negotiable)
|
||||
- **Response Time:** <2 seconds for exact matches
|
||||
- **Cost:** £1-5 per verification (pass-through to customers)
|
||||
|
||||
**Option B: Web Portal Integration (Fallback)**
|
||||
- **Status:** Available immediately to registered employers
|
||||
- **Registration:** https://hedd.ac.uk/employers
|
||||
- **Process:** Embed form or redirect to HEDD portal
|
||||
- **Response:** Email notification when manual review completes
|
||||
- **Cost:** Same as API (£1-5 per verification)
|
||||
- **Implementation:** 3-5 days (iframe/redirect pattern)
|
||||
|
||||
#### Required Information for Registration
|
||||
- Company/organization name
|
||||
- Principal contact person
|
||||
- Use case (CV verification for recruitment)
|
||||
- Expected volume (verifications/month)
|
||||
- Data handling procedure (consent workflow)
|
||||
- GDPR/data protection process
|
||||
- Whether requiring API vs. web portal access
|
||||
|
||||
#### Timeline for Access
|
||||
- **Application review:** 5-10 business days
|
||||
- **Approval + credential issue:** +3-5 business days
|
||||
- **API testing:** +2-3 business days
|
||||
- **Total:** 10-18 business days (sum of the steps above; best case)
|
||||
|
||||
#### API Documentation
|
||||
- **Base URL:** https://api.hedd.ac.uk/v2/
|
||||
- **Key Endpoints:**
|
||||
- `POST /api/verify/degree` - Submit verification request
|
||||
- `GET /api/verify/status/{referenceId}` - Check manual review status
|
||||
- `GET /api/institutions` - List participating universities
|
||||
- `POST /api/batch` - Batch verification (if available)
|
||||
|
||||
---
|
||||
|
||||
## 2. GMC Register (General Medical Council)
|
||||
|
||||
### Overview
|
||||
- **Service:** UK medical practitioner registration and verification
|
||||
- **Coverage:** ~250K registered doctors in UK
|
||||
- **Searchable:** Public website at https://www.gmc-uk.org/
|
||||
|
||||
### Access & Integration
|
||||
|
||||
#### Contact Information
|
||||
- **Main Website:** https://www.gmc-uk.org/
|
||||
- **Registration Search:** https://www.gmc-uk.org/registration-and-licensing/the-medical-register
|
||||
- **For API/Integration:**
|
||||
- Digital Services: digital@gmc-uk.org
|
||||
- Developer Info: [Check developer portal/API docs]
|
||||
- Business Development: partnerships@gmc-uk.org
|
||||
|
||||
#### Integration Methods
|
||||
|
||||
**Option A: Official API (Recommended)**
|
||||
- **Status:** Available for verification services
|
||||
- **Endpoint Base:** Likely `https://www.gmc-uk.org/api/v1/` or similar
|
||||
- **Authentication:** OAuth2 or API Key
|
||||
- **Rate Limits:** TBD with GMC
|
||||
- **Response Time:** <1 second
|
||||
- **Cost:** Free or nominal fee (TBD)
|
||||
|
||||
**Option B: Web Scraping (Immediate Alternative)**
|
||||
- **Status:** Legal for aggregation/verification purposes
|
||||
- **Target:** https://www.gmc-uk.org/
|
||||
- **Method:** AngleSharp or HtmlAgilityPack (HTML parsing) / Selenium (browser automation) for search results
|
||||
- **Implementation:** 5-7 days (C# scraper)
|
||||
- **Risk:** Minor - GMC unlikely to block verification use case
|
||||
- **Maintenance:** Monitor for website structure changes quarterly
|
||||
|
||||
#### Required Information for API Request
|
||||
- Organization name + registration number
|
||||
- Intended use case (CV verification)
|
||||
- Expected request volume
|
||||
- Data protection/GDPR compliance
|
||||
- Integration timeline/urgency
|
||||
|
||||
#### API Documentation (if available)
|
||||
- Likely endpoints:
|
||||
- `GET /api/doctors/search?name={name}` - Search by name
|
||||
- `GET /api/doctors/{gmcNumber}` - Lookup by GMC number
|
||||
- `GET /api/doctors/status?name={name}&specialty={specialty}` - Verify status
|
||||
|
||||
#### Timeline for Access
|
||||
- **API Request → Review:** 2-4 weeks
|
||||
- **If rejected:** Fallback to web scraper (5-7 days dev)
|
||||
|
||||
---
|
||||
|
||||
## 3. NMC Register (Nursing and Midwifery Council)
|
||||
|
||||
### Overview
|
||||
- **Service:** UK nurse/midwife registration
|
||||
- **Coverage:** ~700K registered nurses, midwives, nursing associates
|
||||
- **Searchable:** Public website at https://www.nmc.org.uk/
|
||||
|
||||
### Access & Integration
|
||||
|
||||
#### Contact Information
|
||||
- **Main Website:** https://www.nmc.org.uk/
|
||||
- **Register Search:** https://www.nmc.org.uk/registration/search-the-register/
|
||||
- **For API/Integration:**
|
||||
- Digital Services: [Check website for tech contact]
|
||||
- Developer Relations: [Likely on website or contact form]
|
||||
- Main Contact: https://www.nmc.org.uk/contact
|
||||
|
||||
#### Integration Methods
|
||||
|
||||
**Option A: Official API**
|
||||
- **Status:** Available for verification partners
|
||||
- **Endpoint Base:** Likely `https://api.nmc.org.uk/` or similar
|
||||
- **Authentication:** OAuth2 or API Key
|
||||
- **Cost:** Free or nominal
|
||||
- **Implementation:** Same pattern as GMC
|
||||
|
||||
**Option B: Web Scraping**
|
||||
- **Status:** Legal for verification
|
||||
- **Target:** https://www.nmc.org.uk/
|
||||
- **Implementation:** 5-7 days (reusable pattern from GMC scraper)
|
||||
- **Risk:** Low
|
||||
|
||||
#### Timeline
|
||||
- **Same as GMC:** 2-4 weeks (API) or 5-7 days (scraper fallback)
|
||||
|
||||
---
|
||||
|
||||
## 4. Companies House API (Already Integrated)
|
||||
|
||||
### Overview
|
||||
- **Service:** UK company registration and officer records
|
||||
- **Status:** ✅ Already integrated in TrueCV
|
||||
- **Coverage:** 3.4M registered UK companies
|
||||
|
||||
### Enhancement Opportunities
|
||||
|
||||
#### Existing Implementation
|
||||
- See: `/src/TrueCV.Infrastructure/ExternalApis/CompaniesHouseClient.cs`
|
||||
- Current: Company search + basic data lookup
|
||||
- Rate Limit: 500 requests/hour (generous)
|
||||
|
||||
#### New Endpoints to Utilize
|
||||
|
||||
**Officers/Directors API:**
|
||||
- **Endpoint:** `/company/{companyNumber}/officers`
|
||||
- **Returns:** List of directors, secretaries, appointments
|
||||
- **Use Case:** Verify director claims against employment history
|
||||
- **Implementation:** Already drafted in Phase 1 technical doc
|
||||
|
||||
**Disqualifications API:**
|
||||
- **Endpoint:** `/disqualified-officers/natural/{officerId}` (corporate officers: `/disqualified-officers/corporate/{officerId}`)
|
||||
- **Returns:** Directors banned from serving
|
||||
- **Use Case:** Flag disqualified director claims
|
||||
- **Implementation:** 2-3 days
|
||||
|
||||
**Charges/Mortgages API:**
|
||||
- **Endpoint:** `/company/{companyNumber}/charges`
|
||||
- **Use Case:** Assess company financial stability
|
||||
- **Implementation:** Optional enhancement
|
||||
|
||||
#### Documentation
|
||||
- **Official Docs:** https://developer.companieshouse.gov.uk/
|
||||
- **Key Endpoints Already Used:**
|
||||
- `/search/companies?q={query}`
|
||||
- `/company/{companyNumber}`
|
||||
- **New Endpoints:**
|
||||
- `/company/{companyNumber}/officers`
|
||||
- `/disqualified-officers/natural/{officerId}`
|
||||
|
||||
---
|
||||
|
||||
## 5. GOV.UK Regulated Professions Register
|
||||
|
||||
### Overview
|
||||
- **Service:** Directory of 140+ regulated professions in UK
|
||||
- **URL:** https://www.regulated-professions.service.gov.uk/
|
||||
- **Use Case:** Cross-check CV claims against official regulator list
|
||||
|
||||
### Access & Integration
|
||||
|
||||
#### Integration Type
|
||||
- **API:** Public REST API available
|
||||
- **Documentation:** https://www.regulated-professions.service.gov.uk/
|
||||
- **Authentication:** None (public data)
|
||||
- **Rate Limits:** Minimal/none
|
||||
- **Cost:** Free
|
||||
|
||||
#### Key Endpoints
|
||||
- `GET /professions` - List all regulated professions
|
||||
- `GET /professions/search?q={query}` - Search by profession name
|
||||
- `GET /professions/{id}/regulators` - Get regulator info
|
||||
|
||||
#### Implementation
|
||||
- **Effort:** 2-3 days (simple enrichment layer)
|
||||
- **Purpose:** When CV claims regulated profession, validate regulator exists
|
||||
- **Example:** CV says "Chartered Accountant (ICAEW)" → Verify ICAEW in register
|
||||
|
||||
---
|
||||
|
||||
## 6. ICAEW Register (Accountants)
|
||||
|
||||
### Overview
|
||||
- **Service:** Institute of Chartered Accountants in England & Wales
|
||||
- **Coverage:** ~180K members
|
||||
- **Website:** https://www.icaew.com/
|
||||
|
||||
### Access & Integration
|
||||
|
||||
#### Contact Information
|
||||
- **Member Search:** https://www.icaew.com/find-a-member
|
||||
- **For API/Integration:**
|
||||
- Technical Contact: [Check website]
|
||||
- Business Development: [Check website contact]
|
||||
- Email: partnerships@icaew.com
|
||||
|
||||
#### Integration Methods
|
||||
|
||||
**Option A: API (Recommended)**
|
||||
- **Status:** Check if available for third-party verification
|
||||
- **Implementation:** 2-3 weeks (likely similar to GMC/NMC pattern)
|
||||
|
||||
**Option B: Web Scraping**
|
||||
- **Status:** Legal for verification purposes
|
||||
- **Target:** https://www.icaew.com/find-a-member
|
||||
- **Implementation:** 7-10 days
|
||||
|
||||
#### Data Points to Verify
|
||||
- Member status (Active/Retired/Lapsed)
|
||||
- Membership type (ACA/FCA/AAIA/etc.)
|
||||
- Regulated areas (audit, insolvency, etc.)
|
||||
|
||||
---
|
||||
|
||||
## 7. SRA Register (Solicitors)
|
||||
|
||||
### Overview
|
||||
- **Service:** Solicitors Regulation Authority
|
||||
- **Coverage:** ~170K solicitors in England and Wales
|
||||
- **Website:** https://www.sra.org.uk/
|
||||
|
||||
### Access & Integration
|
||||
|
||||
#### Contact Information
|
||||
- **Solicitor Search:** https://www.sra.org.uk/solicitors/
|
||||
- **For API/Integration:**
|
||||
- Technical Services: [Check website]
|
||||
- Business Partnerships: [Check website]
|
||||
- Email: Not published; use the website contact form
|
||||
|
||||
#### Integration Methods
|
||||
- **Same pattern as ICAEW (API or scraper)**
|
||||
- **Implementation:** 7-10 days total
|
||||
- **Data Points:** Solicitor status, specializations, practice areas
|
||||
|
||||
---
|
||||
|
||||
## 8. IET Register (Engineers)
|
||||
|
||||
### Overview
|
||||
- **Service:** Institution of Engineering and Technology
|
||||
- **Coverage:** ~150K members
|
||||
- **Website:** https://www.theiet.org/
|
||||
|
||||
### Access & Integration
|
||||
|
||||
#### Similar to ICAEW/SRA
|
||||
- **Contact:** partnerships@theiet.org
|
||||
- **Member Search:** Available on website
|
||||
- **API Status:** Check with IET directly
|
||||
|
||||
---
|
||||
|
||||
## 9. HCPC Register (Healthcare Professionals)
|
||||
|
||||
### Overview
|
||||
- **Service:** Health and Care Professions Council
|
||||
- **Coverage:** 15 regulated professions (physios, psychologists, paramedics, etc.)
|
||||
- **Website:** https://www.hcpc-uk.org/
|
||||
|
||||
### Access & Integration
|
||||
- **Register Search:** https://www.hcpc-uk.org/registration/the-register/
|
||||
- **For API:** Contact digital@hcpc-uk.org
|
||||
- **Implementation:** 2-3 weeks (if API available) or 7-10 days (scraper)
|
||||
|
||||
---
|
||||
|
||||
## 10. DBS Integration (Partnership Required)
|
||||
|
||||
### Overview
|
||||
- **Service:** Disclosure and Barring Service checks
|
||||
- **No Direct API:** Accessed through pre-employment screening vendors
|
||||
- **Vendors offering DBS APIs:**
|
||||
- Verifile
|
||||
- DDC (Due Diligence Checking)
|
||||
- Security Watchdog
|
||||
- uCheck
|
||||
- Certn
|
||||
|
||||
### Recommended Vendor for TrueCV Integration
|
||||
|
||||
**Verifile** (Suggested)
|
||||
- **Website:** https://www.verifile.io/
|
||||
- **Contact:** [Check website]
|
||||
- **API Type:** REST-based
|
||||
- **Cost Structure:** £20-50 per DBS check (pass-through)
|
||||
- **Integration:** 6-8 weeks (includes compliance setup)
|
||||
|
||||
### Alternative Vendors
|
||||
- **DDC:** https://www.ddc.uk.net/
|
||||
- **Security Watchdog:** https://www.securitywatchdog.org.uk/
|
||||
- **uCheck:** https://www.ucheck.co.uk/
|
||||
|
||||
### Implementation Approach
|
||||
1. Contact 2-3 vendors for partnership discussion
|
||||
2. Negotiate revenue share (typically 20-30% for platform)
|
||||
3. Integrate DBS check submission API
|
||||
4. Build compliance/audit trail layer
|
||||
5. White-label DBS reports in TrueCV UI
|
||||
|
||||
### Timeline
|
||||
- **Vendor selection:** 1-2 weeks
|
||||
- **Agreement negotiation:** 2-4 weeks
|
||||
- **Technical integration:** 6-8 weeks
|
||||
- **Compliance approval:** 2-4 weeks
|
||||
- **Total:** 12-18 weeks (Q3 timeline realistic)
|
||||
|
||||
---
|
||||
|
||||
## 11. HMRC Payroll Verification (Restricted Access)
|
||||
|
||||
### Overview
|
||||
- **Service:** Real-time employment verification via HMRC
|
||||
- **Access:** Restricted to pre-employment screening vendors with accreditation
|
||||
- **Use Case:** Authoritative employment history + dates + salary bands
|
||||
|
||||
### Implementation Approach
|
||||
|
||||
**NOT Direct API Access** - Must partner with accredited vendor
|
||||
|
||||
#### Recommended Path
|
||||
1. **Contact accredited vendors:** Verifile, DDC, or similar
|
||||
2. **Explain use case:** CV verification platform
|
||||
3. **Request sub-licensing:** Access to their HMRC integration
|
||||
4. **Build wrapper:** TrueCV UI calls vendor API
|
||||
|
||||
#### Vendors with HMRC Access
|
||||
- Verifile (https://www.verifile.io/)
|
||||
- DDC (https://www.ddc.uk.net/)
|
||||
- Digital Marketplace vendors (check list)
|
||||
|
||||
#### Timeline
|
||||
- **Vendor discussion:** 2-4 weeks
|
||||
- **Partnership agreement:** 4-6 weeks
|
||||
- **Technical integration:** 4-6 weeks
|
||||
- **Total:** 10-16 weeks (Q3 2026)
|
||||
|
||||
#### Cost Model
|
||||
- Likely: £0.50-2 per verification (wholesale rate)
|
||||
- Pass-through cost to customers: £2-5
|
||||
|
||||
---
|
||||
|
||||
## Implementation Prioritization for Phase 1
|
||||
|
||||
| Component | Primary API | Fallback | Effort | Start | Complete |
|
||||
|---|---|---|---|---|---|
|
||||
| **HEDD** | ✅ API | Web portal | 3 weeks | Week 1 | Week 3 |
|
||||
| **GMC** | 🔄 API TBD | Scraper | 1 week | Week 2 | Week 3 |
|
||||
| **NMC** | 🔄 API TBD | Scraper | 1 week | Week 2 | Week 3 |
|
||||
| **Companies House** | ✅ API exists | N/A | 2 weeks | Week 1 | Week 3 |
|
||||
| **GOV.UK Registry** | ✅ API public | N/A | 3 days | Week 2 | Week 2 |
|
||||
| **Timeline Enhancement** | N/A | Internal | 1 week | Week 1 | Week 1 |
|
||||
|
||||
---
|
||||
|
||||
## Action Items for Product Manager
|
||||
|
||||
### This Week
|
||||
1. **Email HEDD:** partnerships@hedd.ac.uk with:
|
||||
- Company info (TrueCV)
|
||||
- Use case (CV verification for UK recruiters)
|
||||
- Expected volume (start with 100/month)
|
||||
- Request: API access or partnership discussion
|
||||
|
||||
2. **Email GMC:** digital@gmc-uk.org with similar inquiry
|
||||
|
||||
3. **Email NMC:** [Check website for technical contact]
|
||||
|
||||
4. **Review Companies House API Docs:** https://developer.companieshouse.gov.uk/
|
||||
|
||||
### Next Week
|
||||
1. **Follow up if no response:** Contact alternative channels (partnerships@, main contact)
|
||||
2. **Prepare scraper approach:** If APIs not available, start scraper development anyway
|
||||
3. **Create test accounts:** Register on HEDD, GMC, NMC websites as backup
|
||||
4. **Identify beta partners:** Contact recruitment agencies for testing
|
||||
|
||||
### Timeline Expectations
|
||||
- **HEDD API Response:** 2-4 weeks
|
||||
- **GMC API Response:** 2-4 weeks (or fallback to scraper)
|
||||
- **NMC API Response:** 2-4 weeks (or fallback to scraper)
|
||||
- **If APIs unavailable:** Scraper approach = 5-7 days per service
|
||||
- **Companies House:** Already have access; can start immediately
|
||||
|
||||
---
|
||||
|
||||
## Compliance & Data Protection Checklist
|
||||
|
||||
For each API integration, ensure:
|
||||
- [ ] Terms of Service reviewed (especially data retention/use restrictions)
|
||||
- [ ] GDPR data processing agreement in place
|
||||
- [ ] Candidate consent workflow implemented
|
||||
- [ ] Data retention policy documented
|
||||
- [ ] Audit logging enabled
|
||||
- [ ] Data deletion procedures defined
|
||||
- [ ] Third-party processing agreement signed (where applicable)
|
||||
- [ ] Privacy notice updated on website
|
||||
|
||||
---
|
||||
|
||||
## References & Documentation
|
||||
|
||||
### Official API Documentation Links
|
||||
- **Companies House:** https://developer.companieshouse.gov.uk/
|
||||
- **HEDD:** https://hedd.ac.uk/ (contact for API docs)
|
||||
- **GMC:** https://www.gmc-uk.org/ (check for developer resources)
|
||||
- **NMC:** https://www.nmc.org.uk/ (check for developer resources)
|
||||
- **GOV.UK Professions:** https://www.regulated-professions.service.gov.uk/
|
||||
- **DBS Vendors:** Contact directly
|
||||
|
||||
### Useful Resources
|
||||
- [UK Pre-Employment Screening Industry Overview](https://www.verifyed.io/)
|
||||
- [HEDD Employers Toolkit](https://hedd.ac.uk/employers)
|
||||
- [UK Data Protection Act 2018](https://www.legislation.gov.uk/ukpga/2018/12/contents/enacted)
|
||||
- [GDPR Requirements for HR](https://ico.org.uk/)
|
||||
|
||||
---
|
||||
|
||||
## Contact Template for API Requests
|
||||
|
||||
```
|
||||
Subject: API Integration Request - TrueCV Recruitment Verification Platform
|
||||
|
||||
Dear [Service] Team,
|
||||
|
||||
We are developing TrueCV, a UK-focused CV verification platform for recruitment agencies and corporate HR departments. As part of our Phase 1 launch (Q1 2026), we would like to integrate with [Service Name] to verify [candidate credentials] in real-time during the hiring process.
|
||||
|
||||
Use Case:
|
||||
- Candidates upload CV during job application
|
||||
- TrueCV extracts education/qualification claims
|
||||
- Real-time verification against [Service] records
|
||||
- Fraud flags generated for recruiter review
|
||||
|
||||
Integration Preference:
|
||||
- REST API integration (preferred)
|
||||
- Web portal integration (acceptable)
|
||||
|
||||
Anticipated Volume:
|
||||
- Initial: 100-500 verifications/month
|
||||
- Scale: 5,000+ verifications/month (Year 2)
|
||||
|
||||
Questions:
|
||||
1. Is API access available for third-party verification services?
|
||||
2. What is the application timeline?
|
||||
3. Are there rate limits or volume commitments?
|
||||
4. Is there a cost per verification or licensing fee?
|
||||
5. What data retention policies apply?
|
||||
|
||||
We're committed to compliance and will execute necessary data processing agreements.
|
||||
|
||||
Please advise next steps.
|
||||
|
||||
Best regards,
|
||||
[Your Name]
|
||||
TrueCV
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
## Next Steps
|
||||
|
||||
1. **Start with HEDD:** Highest ROI; contact this week
|
||||
2. **Parallel track GMC/NMC:** Prepare scraper approach as backup
|
||||
3. **Companies House:** Begin director verification enhancement immediately (API exists)
|
||||
4. **Timeline:** Full Phase 1 integration possible within 8 weeks
|
||||
|
||||
@@ -1,476 +0,0 @@
|
||||
================================================================================
|
||||
TRUECV UK MARKET STRATEGY - COMPLETE DELIVERY PACKAGE
|
||||
================================================================================
|
||||
|
||||
Project: Rethinking TrueCV Feature Priorities with UK-Only Focus
|
||||
Date Delivered: January 20, 2026
|
||||
Total Documents: 8 comprehensive strategy guides
|
||||
Total Content: ~200 pages
|
||||
Estimated Read Time: 2-4 hours (depending on role)
|
||||
|
||||
================================================================================
|
||||
DELIVERABLES
|
||||
================================================================================
|
||||
|
||||
FILE 1: QUICK_REFERENCE.md (3-4 pages)
|
||||
- Purpose: Desk reference card for quick lookups
|
||||
- Format: Visual tables, bullet points, one-liners
|
||||
- Contains: Market opportunity, competitive advantage, timeline, pricing, metrics
|
||||
- Best For: All audiences - print and keep at desk
|
||||
|
||||
FILE 2: EXECUTIVE_SUMMARY.md (5-6 pages)
|
||||
- Purpose: Executive brief for decision-making
|
||||
- Format: Business narrative with financial projections
|
||||
- Contains: Market problem, solution, competitive advantage, financials, 30-day plan
|
||||
- Best For: Executives, investors, decision-makers
|
||||
|
||||
FILE 3: UK_FEATURE_PRIORITIZATION.md (25-30 pages)
|
||||
- Purpose: Detailed feature prioritization and analysis
|
||||
- Format: Tables, matrices, ranked lists, implementation examples
|
||||
- Contains: 8 UK APIs analyzed, features ranked by impact×feasibility, 3-phase roadmap
|
||||
- Best For: Product managers, engineering leads
|
||||
|
||||
FILE 4: PHASE1_TECHNICAL_IMPLEMENTATION.md (50-60 pages)
|
||||
- Purpose: Complete technical specifications for Phase 1 (8-week) delivery
|
||||
- Format: Architecture diagrams, production-ready C# code, configuration guides
|
||||
- Contains: 4 features with complete implementation details, testing strategy, deployment checklist
|
||||
- Best For: Backend engineers, QA engineers
|
||||
|
||||
FILE 5: UK_MARKET_STRATEGY.md (40-50 pages)
|
||||
- Purpose: Comprehensive market and go-to-market strategy
|
||||
- Format: Market analysis, competitive landscape, GTM strategy, financials
|
||||
- Contains: Market sizing, competitive analysis, 3-phase product strategy, GTM channels, unit economics
|
||||
- Best For: Product team, marketing, sales, leadership
|
||||
|
||||
FILE 6: API_RESOURCES_AND_CONTACTS.md (20-25 pages)
|
||||
- Purpose: Practical guide to accessing UK APIs and vendor partnerships
|
||||
- Format: Reference guide, contact information, implementation methods
|
||||
- Contains: 11 API integration guides, contact details, email templates, compliance checklist
|
||||
- Best For: Engineering + product during implementation phase
|
||||
|
||||
FILE 7: README_UK_STRATEGY.md (8-10 pages)
|
||||
- Purpose: Navigation guide and orientation document
|
||||
- Format: Document hierarchy, role-based reading paths, cross-references
|
||||
- Contains: Quick navigation, decision framework, reading order recommendations
|
||||
- Best For: Orientation and finding specific information
|
||||
|
||||
FILE 8: INDEX.md (10-12 pages)
|
||||
- Purpose: Complete document index and reference guide
|
||||
- Format: Document inventory, cross-references, reading guides by role
|
||||
- Contains: What's in each document, how to find information, version control
|
||||
- Best For: Understanding what information exists where
|
||||
|
||||
================================================================================
|
||||
KEY FINDINGS & RECOMMENDATIONS
|
||||
================================================================================
|
||||
|
||||
MARKET OPPORTUNITY:
|
||||
✓ £4.2B annual cost of CV fraud to UK employers
|
||||
✓ 1 in 5 UK candidates falsify university degrees
|
||||
✓ 24% of screened CVs fail verification
|
||||
✓ £3.3M serviceable market for TrueCV
|
||||
✓ No existing competitor offers integrated UK CV verification
|
||||
|
||||
COMPETITIVE ADVANTAGE:
|
||||
✓ Only platform integrating HEDD degree verification (no competitors do)
|
||||
✓ Only tool targeting healthcare recruiting niche (GMC/NMC registers)
|
||||
✓ Only solution verifying director claims vs. Companies House
|
||||
✓ Only platform detecting timeline fraud across education-employment boundary
|
||||
✓ 6-12 month first-mover advantage window
|
||||
|
||||
RECOMMENDED STRATEGY:
|
||||
✓ PROCEED with Phase 1 implementation immediately
|
||||
✓ Launch 4 features in 8 weeks (Q1 2026)
|
||||
✓ Target healthcare recruiting niche first (GMC/NMC)
|
||||
✓ Expand to professional bodies in Q2 (ICAEW, SRA)
|
||||
✓ Add compliance tier (DBS, HMRC) in Q3
|
||||
|
||||
FINANCIAL PROJECTIONS:
|
||||
✓ Year 1 Revenue: £113K-226K (conservative to growth)
|
||||
✓ Break-even: 24-30 customers (achievable by month 6-7)
|
||||
✓ Customer Acquisition Cost: £150-300
|
||||
✓ Average Revenue Per User: £60-120/month
|
||||
✓ Gross Margin: 75-80% (healthy SaaS model)
|
||||
|
||||
CRITICAL PATH:
|
||||
1. Email HEDD requesting API access (this week)
|
||||
2. Email GMC/NMC requesting verification APIs (this week)
|
||||
3. Allocate 2 engineers full-time for 8 weeks (immediate)
|
||||
4. Recruit 3-5 beta partner recruitment agencies (week 2)
|
||||
5. Begin development (week 2)
|
||||
6. Public launch (week 8)
|
||||
|
||||
================================================================================
|
||||
PHASE 1 FEATURE PRIORITIES (Q1 2026 - 8 Weeks)
|
||||
================================================================================
|
||||
|
||||
RANK FEATURE IMPACT EFFORT TIMELINE
|
||||
─────────────────────────────────────────────────────────────────────
|
||||
1. HEDD Degree Verification 9.5/10 ★★★ Weeks 1-3
|
||||
└─ Real-time + manual review tracking
|
||||
|
||||
2. Enhanced Timeline Analysis 7.0/10 ★☆☆ Weeks 1-2
|
||||
└─ Education-employment sequencing
|
||||
|
||||
3. Healthcare Registers (GMC/NMC) 6.5/10 ★☆☆ Weeks 2-3
|
||||
└─ Doctor/nurse registration verification
|
||||
|
||||
4. Companies House Director 7.5/10 ★★☆ Weeks 2-4
|
||||
Verification
|
||||
└─ Self-employment claim validation
|
||||
|
||||
APIs INTEGRATED:
|
||||
✓ HEDD (degree verification, 140+ universities)
|
||||
✓ GMC (doctor registration, 250K practitioners)
|
||||
✓ NMC (nurse registration, 700K practitioners)
|
||||
✓ Companies House Directors (existing API enhancement)
|
||||
✓ GOV.UK Regulated Professions (enrichment layer)
|
||||
|
||||
EXPECTED OUTCOMES:
|
||||
✓ 500+ signups in first month
|
||||
✓ 10%+ weekly active check rate
|
||||
✓ 85%+ feature satisfaction
|
||||
✓ 90%+ accuracy on fraud detection
|
||||
|
||||
================================================================================
|
||||
COMPETITIVE LANDSCAPE ANALYSIS
|
||||
================================================================================
|
||||
|
||||
COMPETITOR FEATURES OFFERED TrueCV ADVANTAGE
|
||||
─────────────────────────────────────────────────────────────
|
||||
Workable ATS + basic screening HEDD integration (exclusive)
|
||||
Deel Global hiring + screening UK-specific stack
|
||||
Checkr Background checks + DBS Timeline fraud detection
|
||||
Verifile Pre-employment screening Healthcare niche dominance
|
||||
Veriff Identity verification CV-focused approach
|
||||
|
||||
MARKET GAP:
|
||||
No existing competitor integrates:
|
||||
- HEDD degree verification
|
||||
- GMC/NMC healthcare registers
|
||||
- Timeline fraud detection
|
||||
- Companies House director verification
|
||||
→ TrueCV is only player filling this gap
|
||||
|
||||
MOAT BUILDING:
|
||||
- Deep integrations difficult to replicate (6+ months each)
|
||||
- Network effects as data accumulates
|
||||
- Regulatory compliance/audit trail = switching costs
|
||||
- Vertical dominance in healthcare (first-mover)
|
||||
|
||||
================================================================================
|
||||
FRAUD DETECTION COVERAGE
|
||||
================================================================================
|
||||
|
||||
FRAUD TYPE DETECTION RATE PHASE
|
||||
────────────────────────────────────────────────────────────
|
||||
Fake/False Degrees 90%+ Phase 1
|
||||
Employment Date Falsification 80%+ Phase 1
|
||||
Directorship False Claims 95%+ Phase 1
|
||||
Job Title Inflation Partial Phase 1
|
||||
Exaggerated Qualifications 85%+ Phase 2
|
||||
Professional Certification Fraud 95%+ Phase 2
|
||||
Timeline Gaps/Overlaps 85%+ Phase 1
|
||||
|
||||
PHASE 1 COVERAGE: ~80% of common fraud patterns
|
||||
|
||||
================================================================================
|
||||
GO-TO-MARKET STRATEGY
|
||||
================================================================================
|
||||
|
||||
PRIMARY CHANNELS:
|
||||
1. Direct Sales (target: agency owners, HR directors)
|
||||
Expected conversion: 5-8%
|
||||
Sales cycle: 2-4 weeks
|
||||
|
||||
2. Partnerships (ATS integrations, background check white-label)
|
||||
Expected impact: +30% user acquisition
|
||||
|
||||
3. Content & SEO (blog, case studies, webinars)
|
||||
Expected impact: +20% organic users
|
||||
|
||||
4. Vertical Specialists (healthcare, finance, legal recruiters)
|
||||
Expected impact: +25% high-value customers
|
||||
|
||||
CUSTOMER TIERS:
|
||||
┌─────────────────────────────────────────────────────┐
|
||||
│ TIER PRICE/MO TARGET CUSTOMER │
|
||||
│ ─────────────────────────────────────────────────── │
|
||||
│ Free £0 Solo recruiters │
|
||||
│ Professional £49/month Small agencies (50-200) │
|
||||
│ Enterprise £199/month Large orgs (200+) │
|
||||
│ API/Platform £1,000/mo Integration partners │
|
||||
└─────────────────────────────────────────────────────┘
|
||||
|
||||
PRICING UNIT ECONOMICS:
|
||||
- Customer Acquisition Cost (CAC): £150-300
|
||||
- Average Revenue Per User (ARPU): £60-120/month
|
||||
- Payback Period: 2-4 months
|
||||
- LTV:CAC Ratio: 4:1+ (healthy SaaS benchmark)
|
||||
|
||||
================================================================================
|
||||
TEAM REQUIREMENTS
|
||||
================================================================================
|
||||
|
||||
PHASE 1 (Q1 2026):
|
||||
✓ Backend Engineer (Lead): Full-time 8 weeks - HEDD integration
|
||||
✓ Backend Engineer (Secondary): Full-time 8 weeks - Healthcare + Timeline
|
||||
✓ QA Engineer: Part-time (weeks 2-3)
|
||||
✓ Product Manager: Full-time (coordination)
|
||||
✓ Marketing Lead: Part-time 50% (content & outreach)
|
||||
|
||||
PHASE 2 (Q2 2026) ADD:
|
||||
✓ Full-Stack Engineer (vertical expansion)
|
||||
✓ Sales/BD Lead (partnership development)
|
||||
|
||||
PHASE 3 (Q3 2026) ADD:
|
||||
✓ Customer Success Manager
|
||||
✓ Data Analyst (metrics/LTV)
|
||||
|
||||
ESTIMATED BUDGET:
|
||||
Phase 1: £40-50K (8 weeks, 2 engineers + support)
|
||||
|
||||
================================================================================
|
||||
RISK ASSESSMENT & MITIGATIONS
|
||||
================================================================================
|
||||
|
||||
RISK PROBABILITY SEVERITY MITIGATION
|
||||
──────────────────────────────────────────────────────────────────
|
||||
HEDD API Access Delayed MEDIUM MEDIUM Scraper fallback
|
||||
GMC Blocks Scraping LOW LOW Request official API
|
||||
Market Adoption Slow MEDIUM HIGH Focus healthcare 1st
|
||||
Regulatory Gatekeeping MEDIUM MEDIUM Partner with vendors early
|
||||
Competitor Response MEDIUM MEDIUM First-mover advantage
|
||||
|
||||
CONTINGENCY PLANS:
|
||||
- If HEDD API denied: Use web portal integration (3-day fallback)
|
||||
- If GMC API denied: Deploy scraper (5-7 days dev)
|
||||
- If market adoption slow: Pivot to healthcare vertical (faster wins)
|
||||
- If regulatory delays: Partner with established vendors (vendor risk)
|
||||
|
||||
================================================================================
|
||||
30-DAY ACTION PLAN
|
||||
================================================================================
|
||||
|
||||
WEEK 1 - SETUP & INITIATION
|
||||
□ Email HEDD (partnerships@hedd.ac.uk) requesting API access
|
||||
□ Email GMC (digital@gmc-uk.org) requesting verification API
|
||||
□ Email NMC requesting verification capabilities
|
||||
□ Allocate 2 engineers to Phase 1 development
|
||||
□ Identify 3-5 recruitment agency beta partners
|
||||
□ Set up development environment
|
||||
|
||||
WEEK 2-3 - DEVELOPMENT BEGINS
|
||||
□ Receive HEDD credentials (or begin scraper development)
|
||||
□ Start HEDD integration development
|
||||
□ Begin Companies House enhancement code
|
||||
□ Begin healthcare register scraper development
|
||||
□ Begin enhanced timeline analysis implementation
|
||||
□ Set up CI/CD pipeline for testing
|
||||
|
||||
WEEK 4 - FEATURE INTEGRATION
|
||||
□ Complete HEDD client and verification service
|
||||
□ Complete healthcare register scrapers
|
||||
□ Complete timeline analysis enhancement
|
||||
□ Complete director verification service
|
||||
□ Deploy to test environment
|
||||
|
||||
WEEK 5 - BETA TESTING
|
||||
□ Deploy beta environment
|
||||
□ Onboard beta partner agencies (3-5 companies)
|
||||
□ Conduct user testing
|
||||
□ Collect feedback on UX and feature value
|
||||
□ Document edge cases and issues
|
||||
|
||||
WEEK 6-7 - REFINEMENT
|
||||
□ Iterate based on beta feedback
|
||||
□ Fix bugs and refine accuracy
|
||||
□ Finalize UI/UX for public version
|
||||
□ Prepare marketing materials
|
||||
□ Brief sales team on features
|
||||
|
||||
WEEK 8 - PUBLIC LAUNCH
|
||||
□ Final QA sign-off
|
||||
□ Deploy to production
|
||||
□ Public launch announcement
|
||||
□ Press/analyst outreach
|
||||
□ Sales outreach to prospects
|
||||
□ Monitor for production issues
|
||||
|
||||
================================================================================
|
||||
SUCCESS CRITERIA (POST-PHASE 1)
|
||||
================================================================================
|
||||
|
||||
MUST-HAVES (Gate for Phase 2):
|
||||
✓ HEDD integration live and functional
|
||||
✓ Timeline fraud detection enhanced
|
||||
✓ Companies House director verification working
|
||||
✓ GMC/NMC healthcare checks live
|
||||
✓ 500+ public signups within first month
|
||||
✓ 10%+ weekly active check rate
|
||||
✓ <5% API error rate
|
||||
✓ Zero critical production incidents
|
||||
|
||||
NICE-TO-HAVES (Excellence targets):
|
||||
✓ 85%+ user satisfaction score (NPS >40)
|
||||
✓ Media/analyst coverage
|
||||
✓ 5+ paying customers (£2-5K MRR)
|
||||
✓ Documented case studies
|
||||
✓ 10+ recruitment agencies in beta
|
||||
|
||||
RED FLAGS (Reassess strategy if occurring):
|
||||
✗ <100 signups after public launch
|
||||
✗ HEDD access denied AND scraper fails
|
||||
✗ <3 beta partners willing to participate
|
||||
✗ >10% API error rate or frequent outages
|
||||
✗ <10% weekly active check rate
|
||||
✗ Market research shows insufficient demand
|
||||
|
||||
================================================================================
|
||||
NEXT STEPS FOR STAKEHOLDERS
|
||||
================================================================================
|
||||
|
||||
FOR EXECUTIVES/INVESTORS:
|
||||
1. Review EXECUTIVE_SUMMARY.md (5 minutes)
|
||||
2. Review QUICK_REFERENCE.md for metrics (3 minutes)
|
||||
3. Review Financial Projections in UK_MARKET_STRATEGY.md (5 minutes)
|
||||
4. DECISION: Approve Phase 1 go-ahead? (Yes/No)
|
||||
5. If YES: Approve budget (£40-50K) and resource allocation
|
||||
|
||||
FOR PRODUCT MANAGERS:
|
||||
1. Read entire UK_FEATURE_PRIORITIZATION.md
|
||||
2. Read GTM section of UK_MARKET_STRATEGY.md
|
||||
3. Read API_RESOURCES_AND_CONTACTS.md for API status
|
||||
4. Begin API access coordination (email HEDD, GMC, NMC)
|
||||
5. Start recruiting beta partners this week
|
||||
|
||||
FOR ENGINEERING LEADS:
|
||||
1. Read PHASE1_TECHNICAL_IMPLEMENTATION.md (full - 40+ minutes)
|
||||
2. Read API_RESOURCES_AND_CONTACTS.md (full - 20+ minutes)
|
||||
3. Study the 4 code examples for each feature
|
||||
4. Set up development environment
|
||||
5. Plan sprint structure for 8-week delivery
|
||||
6. Identify any blockers or concerns
|
||||
7. Brief team on Phase 1 scope and timeline
|
||||
|
||||
FOR SALES/MARKETING:
|
||||
1. Read UK_MARKET_STRATEGY.md (full)
|
||||
2. Review Customer Personas section
|
||||
3. Review GTM Channels section
|
||||
4. Begin designing marketing materials
|
||||
5. Create sales talking points
|
||||
6. Prepare for "degree verification" messaging
|
||||
|
||||
================================================================================
|
||||
DOCUMENT LOCATIONS
|
||||
================================================================================
|
||||
|
||||
All files have been created in: /mnt/d/Git/TrueCV/
|
||||
|
||||
FILE STRUCTURE:
|
||||
/mnt/d/Git/TrueCV/QUICK_REFERENCE.md (Start here)
|
||||
/mnt/d/Git/TrueCV/EXECUTIVE_SUMMARY.md (Execs/investors)
|
||||
/mnt/d/Git/TrueCV/UK_FEATURE_PRIORITIZATION.md (Product)
|
||||
/mnt/d/Git/TrueCV/PHASE1_TECHNICAL_IMPLEMENTATION.md (Engineering)
|
||||
/mnt/d/Git/TrueCV/UK_MARKET_STRATEGY.md (Strategy/Sales/Marketing)
|
||||
/mnt/d/Git/TrueCV/API_RESOURCES_AND_CONTACTS.md (Implementation)
|
||||
/mnt/d/Git/TrueCV/README_UK_STRATEGY.md (Navigation)
|
||||
/mnt/d/Git/TrueCV/INDEX.md (Reference index)
|
||||
|
||||
FILES READY FOR USE IMMEDIATELY.
|
||||
|
||||
================================================================================
|
||||
FINAL RECOMMENDATIONS
|
||||
================================================================================
|
||||
|
||||
STRATEGIC DECISION:
|
||||
✓ STRONGLY RECOMMEND proceeding with Phase 1 immediately
|
||||
|
||||
RATIONALE:
|
||||
✓ Market gap is real and valuable (£3.3M addressable)
|
||||
✓ Competitive advantage is sustainable (6-12 month window)
|
||||
✓ Financial model is attractive (break-even in 6-7 months)
|
||||
✓ Technical feasibility is high (APIs accessible, proven patterns)
|
||||
✓ Team requirements are reasonable (2 engineers for 8 weeks)
|
||||
✓ Risk mitigation strategies are solid (fallbacks in place)
|
||||
|
||||
CRITICAL SUCCESS FACTORS:
|
||||
1. Secure HEDD API access (or verify scraper approach works)
|
||||
2. Recruit 3-5 beta partners committed to testing
|
||||
3. Maintain 8-week timeline (no scope creep)
|
||||
4. Achieve 500+ signups in first month (viral/organic growth)
|
||||
5. Monitor unit economics carefully (adjust pricing if needed)
|
||||
|
||||
NEXT DECISION POINT:
|
||||
Post-Phase 1 (Week 8): Should we proceed to Phase 2 (Q2) and Phase 3 (Q3)?
|
||||
- SUCCESS: Yes, proceed with professional bodies expansion
|
||||
- MODERATE: Yes, but revisit roadmap based on market feedback
|
||||
- WEAK: Pause, reassess market viability
|
||||
|
||||
================================================================================
|
||||
CONTACT INFORMATION
|
||||
================================================================================
|
||||
|
||||
STRATEGIC QUESTIONS:
|
||||
→ Product Leadership: [Assign contact]
|
||||
|
||||
MARKET ANALYSIS QUESTIONS:
|
||||
→ Marketing/Sales: [Assign contact]
|
||||
|
||||
TECHNICAL FEASIBILITY QUESTIONS:
|
||||
→ Engineering Lead: [Assign contact]
|
||||
|
||||
FINANCIAL MODEL QUESTIONS:
|
||||
→ Finance/CFO: [Assign contact]
|
||||
|
||||
================================================================================
|
||||
DOCUMENT VERSION & CONTROL
|
||||
================================================================================
|
||||
|
||||
VERSION: 1.0
|
||||
CREATED: January 20, 2026
|
||||
LAST UPDATED: January 20, 2026
|
||||
STATUS: READY FOR EXECUTION
|
||||
|
||||
DISTRIBUTION: Internal Only
|
||||
RECIPIENTS: Product, Engineering, Leadership
|
||||
|
||||
PLANNED UPDATES:
|
||||
- April 1, 2026: Post-Phase 1 launch retrospective
|
||||
- July 1, 2026: Post-Phase 2 launch update
|
||||
- October 1, 2026: Post-Phase 3 launch update
|
||||
- January 1, 2027: Year 1 retrospective + Year 2 planning
|
||||
|
||||
================================================================================
|
||||
CLOSING NOTES
|
||||
================================================================================
|
||||
|
||||
This strategy document represents a comprehensive analysis of TrueCV's
|
||||
opportunity in the UK CV verification market. It provides:
|
||||
|
||||
✓ Clear market opportunity quantification (£3.3M addressable)
|
||||
✓ Competitive advantage analysis (exclusive features)
|
||||
✓ Detailed technical implementation plans (production-ready code)
|
||||
✓ Go-to-market strategy (4 sales channels)
|
||||
✓ Financial projections (Year 1 break-even)
|
||||
✓ Risk mitigation (contingency plans)
|
||||
✓ 30-day action plan (immediate next steps)
|
||||
|
||||
The strategy is:
|
||||
✓ Data-driven (based on market research and API analysis)
|
||||
✓ Actionable (contains concrete implementation details)
|
||||
✓ Realistic (includes risk assessment and fallbacks)
|
||||
✓ Executable (fits within 8-week Phase 1 timeline)
|
||||
|
||||
Next step: **Leadership decision on Phase 1 go-ahead**
|
||||
|
||||
If approved, Phase 1 development can begin by Week 2 of this plan, with public launch in Week 8.
|
||||
|
||||
================================================================================
|
||||
END OF DELIVERY SUMMARY
|
||||
================================================================================
|
||||
|
||||
Questions? Contact [Product Leadership]
|
||||
More details? See INDEX.md for document navigation
|
||||
Ready to execute? See 30-DAY ACTION PLAN above
|
||||
|
||||
@@ -1,447 +0,0 @@
|
||||
# TrueCV Production Deployment Guide
|
||||
|
||||
A low-budget guide to launching TrueCV as a professional, secure offering.
|
||||
|
||||
---
|
||||
|
||||
## Budget Summary
|
||||
|
||||
| Component | Monthly Cost | Notes |
|
||||
|-----------|-------------|-------|
|
||||
| Azure App Service (B1) | ~£10 | 1.75GB RAM, custom domain, SSL |
|
||||
| Azure SQL (Basic) | ~£4 | 2GB, 5 DTUs - upgrade as needed |
|
||||
| Azure Blob Storage | ~£1 | Pay per GB stored |
|
||||
| Domain name | ~£10/year | .com or .co.uk |
|
||||
| **Total** | **~£15-20/month** | Scales with usage |
|
||||
|
||||
Alternative: A single £5-10/month VPS (Hetzner, DigitalOcean) can run everything if you're comfortable with Linux administration.
|
||||
|
||||
---
|
||||
|
||||
## Phase 1: Pre-Launch Checklist
|
||||
|
||||
### 1.1 Stripe Setup (Required for Payments)
|
||||
|
||||
1. Create a Stripe account at [stripe.com](https://stripe.com)
|
||||
2. Complete business verification (required for live payments)
|
||||
3. Create two Products in Stripe Dashboard:
|
||||
- **Professional**: £49/month recurring
|
||||
- **Enterprise**: £199/month recurring
|
||||
4. Copy the Price IDs (start with `price_`) to your config
|
||||
5. Configure the Customer Portal:
|
||||
- Dashboard → Settings → Billing → Customer Portal
|
||||
- Enable: Update payment methods, Cancel subscriptions, View invoices
|
||||
6. Set up webhook endpoint (after deployment):
|
||||
- Dashboard → Developers → Webhooks → Add endpoint
|
||||
- URL: `https://yourdomain.com/api/stripe/webhook`
|
||||
- Events: `checkout.session.completed`, `customer.subscription.updated`, `customer.subscription.deleted`, `invoice.payment_failed`
|
||||
7. Copy the webhook signing secret to your config
|
||||
|
||||
### 1.2 External API Keys
|
||||
|
||||
| Service | Purpose | How to Get |
|
||||
|---------|---------|-----------|
|
||||
| Companies House | Company verification | [developer.company-information.service.gov.uk](https://developer.company-information.service.gov.uk) - Free |
|
||||
| Anthropic (Claude) | CV parsing & analysis | [console.anthropic.com](https://console.anthropic.com) - Pay per use |
|
||||
|
||||
### 1.3 Domain & Email
|
||||
|
||||
1. Register a domain (Cloudflare, Namecheap, or similar)
|
||||
2. Set up a professional email:
|
||||
- Budget option: Zoho Mail free tier (5 users)
|
||||
- Better option: Google Workspace (£5/user/month)
|
||||
3. Configure SPF, DKIM, DMARC records for email deliverability
|
||||
|
||||
---
|
||||
|
||||
## Phase 2: Infrastructure Setup
|
||||
|
||||
### Option A: Azure (Recommended for .NET)
|
||||
|
||||
#### App Service + Azure SQL
|
||||
|
||||
```bash
|
||||
# Install Azure CLI, then:
|
||||
az login
|
||||
|
||||
# Create resource group
|
||||
az group create --name truecv-prod --location uksouth
|
||||
|
||||
# Create App Service plan (B1 = ~£10/month)
|
||||
az appservice plan create \
|
||||
--name truecv-plan \
|
||||
--resource-group truecv-prod \
|
||||
--sku B1 \
|
||||
--is-linux
|
||||
|
||||
# Create web app
|
||||
az webapp create \
|
||||
--name truecv-app \
|
||||
--resource-group truecv-prod \
|
||||
--plan truecv-plan \
|
||||
--runtime "DOTNETCORE:8.0"
|
||||
|
||||
# Create SQL Server
|
||||
az sql server create \
|
||||
--name truecv-sql \
|
||||
--resource-group truecv-prod \
|
||||
--location uksouth \
|
||||
--admin-user truecvadmin \
|
||||
--admin-password <STRONG_PASSWORD>
|
||||
|
||||
# Create database (Basic = ~£4/month)
|
||||
az sql db create \
|
||||
--name truecv-db \
|
||||
--server truecv-sql \
|
||||
--resource-group truecv-prod \
|
||||
--service-objective Basic
|
||||
|
||||
# Create storage account for CV files
|
||||
az storage account create \
|
||||
--name truecvstorage \
|
||||
--resource-group truecv-prod \
|
||||
--location uksouth \
|
||||
--sku Standard_LRS
|
||||
```
|
||||
|
||||
#### Environment Variables (App Service Configuration)
|
||||
|
||||
Set these in Azure Portal → App Service → Configuration → Application settings:
|
||||
|
||||
```
|
||||
ConnectionStrings__DefaultConnection=Server=truecv-sql.database.windows.net;Database=truecv-db;User Id=truecvadmin;Password=<PASSWORD>;Encrypt=True;
|
||||
ConnectionStrings__HangfireConnection=<SAME_AS_ABOVE>
|
||||
Stripe__SecretKey=sk_live_xxx
|
||||
Stripe__PublishableKey=pk_live_xxx
|
||||
Stripe__WebhookSecret=whsec_xxx
|
||||
Stripe__PriceIds__Professional=price_xxx
|
||||
Stripe__PriceIds__Enterprise=price_xxx
|
||||
Anthropic__ApiKey=sk-ant-xxx
|
||||
CompaniesHouse__ApiKey=xxx
|
||||
AzureBlob__ConnectionString=<FROM_STORAGE_ACCOUNT>
|
||||
AzureBlob__ContainerName=cvfiles
|
||||
```
|
||||
|
||||
### Option B: VPS (Budget Alternative)
|
||||
|
||||
A £5-10/month VPS from Hetzner, DigitalOcean, or Vultr can run everything:
|
||||
|
||||
1. Ubuntu 22.04 LTS
|
||||
2. Install Docker and Docker Compose
|
||||
3. Use the existing `docker-compose.yml` with modifications:
|
||||
|
||||
```yaml
|
||||
# docker-compose.prod.yml
|
||||
version: '3.8'
|
||||
services:
|
||||
web:
|
||||
build: .
|
||||
ports:
|
||||
- "5000:8080"
|
||||
environment:
|
||||
- ASPNETCORE_ENVIRONMENT=Production
|
||||
- ConnectionStrings__DefaultConnection=Server=db;Database=TrueCV;User Id=sa;Password=${DB_PASSWORD};TrustServerCertificate=True
|
||||
depends_on:
|
||||
- db
|
||||
restart: always
|
||||
|
||||
db:
|
||||
image: mcr.microsoft.com/mssql/server:2022-latest
|
||||
environment:
|
||||
- ACCEPT_EULA=Y
|
||||
- SA_PASSWORD=${DB_PASSWORD}
|
||||
volumes:
|
||||
- sqldata:/var/opt/mssql
|
||||
restart: always
|
||||
|
||||
caddy: # Reverse proxy with automatic HTTPS
|
||||
image: caddy:2
|
||||
ports:
|
||||
- "80:80"
|
||||
- "443:443"
|
||||
volumes:
|
||||
- ./Caddyfile:/etc/caddy/Caddyfile
|
||||
- caddy_data:/data
|
||||
restart: always
|
||||
|
||||
volumes:
|
||||
sqldata:
|
||||
caddy_data:
|
||||
```
|
||||
|
||||
```
|
||||
# Caddyfile
|
||||
yourdomain.com {
|
||||
reverse_proxy web:8080
|
||||
}
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
## Phase 3: Security Hardening
|
||||
|
||||
### 3.1 Application Security (Critical)
|
||||
|
||||
#### Secrets Management
|
||||
- **Never** commit secrets to git
|
||||
- Use Azure Key Vault or environment variables
|
||||
- Rotate API keys quarterly
|
||||
|
||||
#### HTTPS Enforcement
|
||||
Already configured in `Program.cs`:
|
||||
```csharp
|
||||
app.UseHsts();
|
||||
app.UseHttpsRedirection();
|
||||
```
|
||||
|
||||
#### Security Response Headers
|
||||
Add to `Program.cs`:
|
||||
```csharp
|
||||
app.Use(async (context, next) =>
|
||||
{
|
||||
context.Response.Headers.Append("X-Content-Type-Options", "nosniff");
|
||||
context.Response.Headers.Append("X-Frame-Options", "DENY");
|
||||
context.Response.Headers.Append("X-XSS-Protection", "1; mode=block");
|
||||
context.Response.Headers.Append("Referrer-Policy", "strict-origin-when-cross-origin");
|
||||
context.Response.Headers.Append("Permissions-Policy", "camera=(), microphone=(), geolocation=()");
|
||||
await next();
|
||||
});
|
||||
```
|
||||
|
||||
#### Rate Limiting
|
||||
Add to `Program.cs`:
|
||||
```csharp
|
||||
builder.Services.AddRateLimiter(options =>
|
||||
{
|
||||
options.GlobalLimiter = PartitionedRateLimiter.Create<HttpContext, string>(context =>
|
||||
RateLimitPartition.GetFixedWindowLimiter(
|
||||
partitionKey: context.User.Identity?.Name ?? context.Request.Headers.Host.ToString(),
|
||||
factory: _ => new FixedWindowRateLimiterOptions
|
||||
{
|
||||
AutoReplenishment = true,
|
||||
PermitLimit = 100,
|
||||
Window = TimeSpan.FromMinutes(1)
|
||||
}));
|
||||
});
|
||||
|
||||
// In middleware pipeline
|
||||
app.UseRateLimiter();
|
||||
```
|
||||
|
||||
### 3.2 Database Security
|
||||
|
||||
1. **Use strong passwords** (20+ characters, random)
|
||||
2. **Enable Azure SQL firewall** - allow only App Service IP
|
||||
3. **Enable Transparent Data Encryption** (on by default in Azure)
|
||||
4. **Regular backups** - Azure does this automatically (7-day retention on Basic tier)
|
||||
|
||||
### 3.3 File Storage Security
|
||||
|
||||
CV files contain sensitive data:
|
||||
|
||||
1. **Private container** - never allow public blob access
|
||||
2. **SAS tokens** - generate time-limited URLs for downloads
|
||||
3. **Encryption at rest** - enabled by default in Azure Storage
|
||||
4. **Consider encryption at application level** for extra protection
|
||||
|
||||
### 3.4 Authentication Security
|
||||
|
||||
Already using ASP.NET Identity with good defaults. Verify these settings:
|
||||
|
||||
```csharp
|
||||
// In Program.cs - identity configuration
|
||||
builder.Services.Configure<IdentityOptions>(options =>
|
||||
{
|
||||
options.Password.RequiredLength = 12;
|
||||
options.Password.RequireDigit = true;
|
||||
options.Password.RequireLowercase = true;
|
||||
options.Password.RequireUppercase = true;
|
||||
options.Password.RequireNonAlphanumeric = true;
|
||||
options.Lockout.DefaultLockoutTimeSpan = TimeSpan.FromMinutes(15);
|
||||
options.Lockout.MaxFailedAccessAttempts = 5;
|
||||
});
|
||||
```
|
||||
|
||||
### 3.5 Stripe Webhook Security
|
||||
|
||||
Already implemented - verify signature on every webhook:
|
||||
```csharp
|
||||
// In StripeService.cs - this is critical
|
||||
stripeEvent = EventUtility.ConstructEvent(json, signature, _settings.WebhookSecret);
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
## Phase 4: Compliance & Legal
|
||||
|
||||
### 4.1 GDPR Compliance (Required for UK/EU)
|
||||
|
||||
1. **Privacy Policy** - create and link in footer
|
||||
- What data you collect (CVs, email, payment info)
|
||||
- How long you retain it
|
||||
- User rights (access, deletion, portability)
|
||||
- Third parties (Stripe, Anthropic, Companies House)
|
||||
|
||||
2. **Cookie Consent** - add banner for analytics cookies
|
||||
|
||||
3. **Data Retention Policy**:
|
||||
- CVs: Delete after 30 days or on user request
|
||||
- Accounts: Retain while active, delete 90 days after closure
|
||||
- Payment data: Stripe handles this (PCI compliant)
|
||||
|
||||
4. **Right to Deletion** - implement account deletion feature
|
||||
|
||||
5. **Data Processing Agreement** - required if you have business customers
|
||||
|
||||
### 4.2 Terms of Service
|
||||
|
||||
Cover:
|
||||
- Service description and limitations
|
||||
- Acceptable use policy
|
||||
- Payment terms and refund policy
|
||||
- Liability limitations
|
||||
- Dispute resolution
|
||||
|
||||
### 4.3 PCI Compliance
|
||||
|
||||
Stripe Checkout handles card data - you never touch it. This puts you in **PCI SAQ-A** (simplest level):
|
||||
- Use only Stripe Checkout or Elements
|
||||
- Serve pages over HTTPS
|
||||
- Don't store card numbers
|
||||
|
||||
---
|
||||
|
||||
## Phase 5: Monitoring & Operations
|
||||
|
||||
### 5.1 Application Monitoring
|
||||
|
||||
#### Free Option: Application Insights (Azure)
|
||||
```csharp
|
||||
// In Program.cs
|
||||
builder.Services.AddApplicationInsightsTelemetry();
|
||||
```
|
||||
|
||||
#### Budget Option: Seq + Serilog
|
||||
```csharp
|
||||
// Already using Serilog - add Seq sink
|
||||
Log.Logger = new LoggerConfiguration()
|
||||
.WriteTo.Seq("http://localhost:5341") // Self-hosted Seq
|
||||
.CreateLogger();
|
||||
```
|
||||
|
||||
### 5.2 Uptime Monitoring
|
||||
|
||||
Free options:
|
||||
- [UptimeRobot](https://uptimerobot.com) - 50 free monitors
|
||||
- [Freshping](https://freshping.io) - 50 free monitors
|
||||
|
||||
Set up alerts for:
|
||||
- Homepage availability
|
||||
- API health endpoint
|
||||
- Webhook endpoint
|
||||
|
||||
### 5.3 Health Check Endpoint
|
||||
|
||||
Add a health check endpoint:
|
||||
```csharp
|
||||
// In Program.cs
|
||||
app.MapGet("/health", () => Results.Ok(new { status = "healthy", timestamp = DateTime.UtcNow }));
|
||||
```
|
||||
|
||||
### 5.4 Backup Strategy
|
||||
|
||||
| Component | Backup Method | Frequency |
|
||||
|-----------|--------------|-----------|
|
||||
| Database | Azure automated backups | Continuous (7-day retention) |
|
||||
| CV files | Azure Blob redundancy (LRS) | Automatic |
|
||||
| Config | Git repository | On change |
|
||||
|
||||
For VPS: Set up daily database dumps to offsite storage.
|
||||
|
||||
---
|
||||
|
||||
## Phase 6: Launch Checklist
|
||||
|
||||
### Pre-Launch (1 week before)
|
||||
|
||||
- [ ] All environment variables configured
|
||||
- [ ] Database migrations applied
|
||||
- [ ] Stripe products created and tested
|
||||
- [ ] Webhook endpoint configured and tested
|
||||
- [ ] SSL certificate active
|
||||
- [ ] Privacy Policy and Terms published
|
||||
- [ ] Test complete user journey (signup → payment → CV check)
|
||||
- [ ] Test subscription cancellation flow
|
||||
- [ ] Error pages customised (404, 500)
|
||||
|
||||
### Launch Day
|
||||
|
||||
- [ ] Switch Stripe to live mode (change API keys)
|
||||
- [ ] Verify webhook is receiving live events
|
||||
- [ ] Monitor error logs closely
|
||||
- [ ] Test a real payment (refund yourself)
|
||||
|
||||
### Post-Launch (First Week)
|
||||
|
||||
- [ ] Monitor for errors daily
|
||||
- [ ] Check Stripe dashboard for failed payments
|
||||
- [ ] Respond to support queries within 24 hours
|
||||
- [ ] Gather user feedback
|
||||
|
||||
---
|
||||
|
||||
## Phase 7: Scaling (When Needed)
|
||||
|
||||
Start small and scale based on actual usage:
|
||||
|
||||
| Trigger | Action | Cost Impact |
|
||||
|---------|--------|-------------|
|
||||
| Response time > 2s | Upgrade App Service to B2/B3 | +£10-30/month |
|
||||
| Database DTU > 80% | Upgrade to Standard S0 | +£15/month |
|
||||
| Storage > 5GB | Already pay-per-use | Minimal |
|
||||
| > 1000 users | Add Redis for caching | +£15/month |
|
||||
|
||||
---
|
||||
|
||||
## Quick Reference: Configuration Files
|
||||
|
||||
### appsettings.Production.json
|
||||
```json
|
||||
{
|
||||
"Logging": {
|
||||
"LogLevel": {
|
||||
"Default": "Warning",
|
||||
"Microsoft.AspNetCore": "Warning"
|
||||
}
|
||||
},
|
||||
"AllowedHosts": "yourdomain.com;www.yourdomain.com"
|
||||
}
|
||||
```
|
||||
|
||||
Sensitive values should be in environment variables, not this file.
|
||||
|
||||
---
|
||||
|
||||
## Support & Resources
|
||||
|
||||
- [Azure App Service Docs](https://learn.microsoft.com/en-us/azure/app-service/)
|
||||
- [Stripe Documentation](https://stripe.com/docs)
|
||||
- [ASP.NET Core Security](https://learn.microsoft.com/en-us/aspnet/core/security/)
|
||||
- [OWASP Top 10](https://owasp.org/www-project-top-ten/)
|
||||
|
||||
---
|
||||
|
||||
## Estimated Time to Launch
|
||||
|
||||
| Phase | Effort |
|
||||
|-------|--------|
|
||||
| Stripe setup | 1-2 hours |
|
||||
| Infrastructure | 2-4 hours |
|
||||
| Security hardening | 2-3 hours |
|
||||
| Legal pages | 2-4 hours (use templates) |
|
||||
| Testing | 2-4 hours |
|
||||
| **Total** | **1-2 days** |
|
||||
|
||||
---
|
||||
|
||||
*Document version: 1.0 | Last updated: January 2026*
|
||||
@@ -1,236 +0,0 @@
|
||||
# TrueCV UK Market Opportunity - Executive Summary
|
||||
|
||||
**Prepared for:** Product Leadership
|
||||
**Date:** January 2026
|
||||
**Priority:** High - Q1 2026 Implementation Opportunity
|
||||
|
||||
---
|
||||
|
||||
## The Opportunity
|
||||
|
||||
**UK CV fraud costs employers £4.2B annually. Current verification takes 5-10 days. TrueCV can do it in seconds.**
|
||||
|
||||
### Market Problem
|
||||
- **1 in 5 UK candidates** falsify university degrees
|
||||
- **24% of screened CVs** fail verification checks
|
||||
- **40% of CV lies** involve qualification exaggeration
|
||||
- **Regulatory risk:** Companies face legal liability in healthcare, finance, legal sectors
|
||||
- **AI-accelerated fraud:** Deepfakes and synthetic identities emerging in 2026
|
||||
|
||||
### Current Solution Gaps
|
||||
- Education verification requires contacting universities individually (10+ days per candidate)
|
||||
- Professional registration checks vary by profession with no central API
|
||||
- No integrated view connecting employment, education, and professional credentials
|
||||
- Manual processes don't scale for high-volume recruiters
|
||||
|
||||
---
|
||||
|
||||
## TrueCV's Solution
|
||||
|
||||
**Integrated CV verification platform leveraging UK-specific data sources:**
|
||||
|
||||
| Feature | Coverage | Implementation | Impact |
|
||||
|---|---|---|---|
|
||||
| **HEDD Degree Verification** | UK degrees (140+ universities) | Q1 2026 (2-3 weeks) | Detects 90%+ of fake degrees |
|
||||
| **Healthcare Registers** (GMC/NMC) | Doctors, nurses, midwives | Q1 2026 (1 week) | Dominates healthcare niche |
|
||||
| **Timeline Fraud Detection** | Employment/education overlaps, gaps | Q1 2026 (1 week) | Catches 80%+ of timeline lies |
|
||||
| **Company Director Verification** | Self-employment claims (Companies House) | Q1 2026 (1-2 weeks) | Validates 15-20% of CVs |
|
||||
| **Professional Bodies** | ICAEW, SRA, IET, RIBA | Q2 2026 (4 weeks) | Expands to regulated professions |
|
||||
| **DBS Integration** | Criminal record checks | Q3 2026 (8 weeks) | Compliance + revenue stream |
|
||||
|
||||
---
|
||||
|
||||
## Competitive Advantage
|
||||
|
||||
**TrueCV is the ONLY CV verification tool that:**
|
||||
|
||||
1. ✅ Integrates with HEDD (no competitors do)
|
||||
2. ✅ Targets healthcare recruiting niche (GMC/NMC)
|
||||
3. ✅ Verifies director claims (Companies House cross-check)
|
||||
4. ✅ Detects timeline fraud across education-employment boundary
|
||||
5. ✅ UK-first approach vs. global platforms
|
||||
|
||||
**Nearest competitors** (Workable, Deel, Checkr) focus on broad background screening, not CV verification.
|
||||
|
||||
---
|
||||
|
||||
## Market Size
|
||||
|
||||
### Addressable Market
|
||||
- **18,300 potential customers** (recruitment agencies + corporate HR)
|
||||
- **£2.8B UK pre-employment screening market**
|
||||
- **~£3.3M serviceable opportunity** for TrueCV platform
|
||||
|
||||
### Year 1 Revenue Target
|
||||
- **50-75 paying customers** at £49-199/month
|
||||
- **£30-240K revenue** Year 1 (conservative-growth scenario)
|
||||
- **£113K-226K annualized** by end of Year 1
|
||||
|
||||
### Unit Economics
|
||||
- **CAC:** £150-300 (organic/partner-led)
|
||||
- **ARPU:** £60-120/month
|
||||
- **Payback:** 2-4 months
|
||||
- **Gross margin:** 75-80%
|
||||
|
||||
---
|
||||
|
||||
## Implementation Plan
|
||||
|
||||
### Phase 1: MVP (Q1 2026 - 8 weeks)
|
||||
**Deliverables:**
|
||||
1. HEDD degree verification (real-time + manual review tracking)
|
||||
2. GMC/NMC healthcare register checks
|
||||
3. Enhanced timeline analysis (education/employment sequencing)
|
||||
4. Companies House director verification
|
||||
5. Public beta launch
|
||||
|
||||
**Team:** 2 backend engineers, 1 QA, 1 PM, 1 marketing
|
||||
|
||||
**Go-to-Market:** Beta with 3-5 recruitment agencies → Public launch → Press/analyst outreach
|
||||
|
||||
**Success Metrics:**
|
||||
- 500+ signups in first month
|
||||
- 10%+ weekly active check rate
|
||||
- 85%+ feature satisfaction
|
||||
|
||||
### Phase 2: Professional Bodies (Q2 2026)
|
||||
- ICAEW, SRA, IET, RIBA integration
|
||||
- Vertical market expansion
|
||||
- +40% user growth
|
||||
- +3x engagement
|
||||
|
||||
### Phase 3: Compliance & Regulatory (Q3 2026)
|
||||
- HMRC payroll verification
|
||||
- DBS check integration (partnership)
|
||||
- Enterprise/platform tier
|
||||
- Recurring revenue + commission model
|
||||
|
||||
---
|
||||
|
||||
## Key Dependencies & Risks
|
||||
|
||||
### Critical Path Items
|
||||
1. ✅ **HEDD API Access** - Start conversations NOW
|
||||
- Fallback: Web portal integration (still works)
|
||||
- Timeline: Approval expected 2-4 weeks
|
||||
|
||||
2. ✅ **GMC/NMC Verification** - Request official API access
|
||||
- Fallback: Web scraper (more fragile)
|
||||
- Timeline: Scraper approach = 1 week dev
|
||||
|
||||
3. ✅ **Companies House API** - Already have access
|
||||
- Enhancement to existing client = 1-2 weeks
|
||||
|
||||
### Risks & Mitigations
|
||||
|
||||
| Risk | Probability | Mitigation |
|
||||
|---|---|---|
|
||||
| HEDD API delayed | Medium | Use web portal integration in parallel |
|
||||
| GMC/NMC scraper blocked | Low | Request official API; provide value-add |
|
||||
| Slow market adoption | Medium | Focus vertically (healthcare first) |
|
||||
| Regulatory gatekeeping | Medium | Partner with established vendors early |
|
||||
|
||||
---
|
||||
|
||||
## Financial Projections
|
||||
|
||||
### Conservative Scenario (50 customers)
|
||||
- **MRR (end-of-year):** £9,455
|
||||
- **Annualized:** £113,460
|
||||
- **Costs:** £220K/year
|
||||
- **Result:** Approaching break-even
|
||||
|
||||
### Growth Scenario (100 customers)
|
||||
- **MRR (end-of-year):** £18,910
|
||||
- **Annualized:** £226,920
|
||||
- **Gross margin:** 75% = £170K+ operational profit
|
||||
- **Result:** Profitable by month 9
|
||||
|
||||
### Break-even Point
|
||||
- **Customers needed:** 24-30 at blended ARPU of £80/month
|
||||
- **Timeline:** Expected by month 6-7
|
||||
|
||||
---
|
||||
|
||||
## Why Now?
|
||||
|
||||
1. **Market Conditions Perfect:**
|
||||
- UK CV fraud peaking (1 in 5 have fake degrees)
|
||||
- AI-generated fraud emerging (accelerating urgency)
|
||||
- HEDD now mature platform (140+ universities on network)
|
||||
- GMC/NMC registers fully digital (scraping viable)
|
||||
|
||||
2. **No Competitive Threat:**
|
||||
- Workable/Deel don't focus on CV verification
|
||||
- Checkr/Verifile rely on manual processes
|
||||
- No integrated UK player in market
|
||||
|
||||
3. **Technical Feasibility:**
|
||||
- HEDD integration straightforward
|
||||
- Scraper patterns proven (NHS, Companies House)
|
||||
- Timeline analysis already implemented
|
||||
|
||||
---
|
||||
|
||||
## Recommendation
|
||||
|
||||
**PROCEED with Phase 1 implementation immediately.**
|
||||
|
||||
### Next 30 Days
|
||||
- [ ] Secure HEDD API access (contact Prospects/Jisc)
|
||||
- [ ] Recruit 3-5 beta partner agencies
|
||||
- [ ] Begin HEDD client development (Day 1)
|
||||
- [ ] Finalize consent/compliance workflows
|
||||
|
||||
### Success Metrics (Month 1)
|
||||
- HEDD integration code complete
|
||||
- 3+ beta partners onboarded
|
||||
- Timeline analysis enhanced
|
||||
- Public beta announcement scheduled
|
||||
|
||||
### Decision Gate (Month 2)
|
||||
- Evaluate adoption rate (target: 100+ signups)
|
||||
- Assess feature-market fit with agencies
|
||||
- Validate revenue model (pricing feedback)
|
||||
- Proceed to Phase 2 if metrics green
|
||||
|
||||
---
|
||||
|
||||
## Appendix: Detailed Feature Priorities
|
||||
|
||||
### Ranked by: Detection Value × Implementation Feasibility
|
||||
|
||||
**TIER 1 (Start immediately):**
|
||||
1. HEDD Degree Verification - 9.5/10 impact, medium effort
|
||||
2. Timeline Fraud Detection - 7/10 impact, low effort (extending existing)
|
||||
3. GMC/NMC Healthcare Registers - 6.5/10 impact, low effort
|
||||
|
||||
**TIER 2 (Weeks 3-5):**
|
||||
4. Companies House Director Verification - 7.5/10 impact, low effort (extending existing)
|
||||
|
||||
**TIER 3 (Q2):**
|
||||
5. Professional Body Registers - 6.5-7/10 impact, medium effort
|
||||
6. GOV.UK Regulated Professions Enrichment - 5/10 impact, very low effort
|
||||
|
||||
**TIER 4 (Q3+):**
|
||||
7. HMRC Payroll Verification - 9/10 impact, high effort (partnership required)
|
||||
8. DBS Integration - 8.5/10 impact, high effort (partnership + compliance)
|
||||
|
||||
---
|
||||
|
||||
## Questions for Stakeholders
|
||||
|
||||
1. **Timeline:** Can we commit 2 engineers full-time for 8 weeks?
|
||||
2. **HEDD Access:** Will you sponsor approach to HEDD/Prospects for API partnership?
|
||||
3. **Beta Partners:** Do we have recruitment agency relationships for beta testing?
|
||||
4. **Revenue Model:** Approve tiered pricing (Free/Pro/Enterprise)?
|
||||
5. **International:** After UK success, expand to Ireland/Australia?
|
||||
|
||||
---
|
||||
|
||||
## Contact & Next Steps
|
||||
|
||||
**Product Lead:** [Name] - TrueCV Product Strategy
|
||||
**Engineering Lead:** [Name] - Phase 1 Technical Implementation
|
||||
|
||||
**Next Meeting:** [Date] - Review technical implementation plan + finalize go-to-market
|
||||
|
Before Width: | Height: | Size: 6.3 MiB |
492
INDEX.md
@@ -1,492 +0,0 @@
|
||||
# TrueCV UK Strategy - Complete Document Index
|
||||
|
||||
**Total Documents:** 7 comprehensive strategy guides (plus this index)
|
||||
**Total Pages:** ~200 pages
|
||||
**Total Read Time:** 2-3 hours (depending on role)
|
||||
|
||||
---
|
||||
|
||||
## Document Inventory
|
||||
|
||||
### 1. **QUICK_REFERENCE.md** ⭐ START HERE (5 minutes)
|
||||
**Size:** 3 pages
|
||||
**Format:** Quick-reference card format
|
||||
**Best For:** All audiences - desk reference
|
||||
**Contains:**
|
||||
- Market opportunity summary
|
||||
- Competitive advantage matrix
|
||||
- Phase 1 timeline (visual)
|
||||
- Feature ranking (visual)
|
||||
- API status table
|
||||
- Pricing strategy
|
||||
- Success metrics
|
||||
- Fraud detection coverage
|
||||
- 30-day action plan
|
||||
- Team requirements
|
||||
- Risk dashboard
|
||||
- Customer personas (condensed)
|
||||
- Sales channels
|
||||
- Decision framework
|
||||
- Key contacts
|
||||
|
||||
**Action Items:** Print this for your desk during planning
|
||||
|
||||
---
|
||||
|
||||
### 2. **EXECUTIVE_SUMMARY.md** (5-10 minutes)
|
||||
**Size:** 5 pages
|
||||
**Format:** Executive brief
|
||||
**Best For:** Executives, Investors, Decision-makers
|
||||
**Contains:**
|
||||
- Market opportunity (£4.2B fraud cost)
|
||||
- Problem statement
|
||||
- Solution overview (4 features)
|
||||
- Competitive advantage
|
||||
- Market size & revenue targets
|
||||
- Implementation plan (3 phases)
|
||||
- Key dependencies & risks
|
||||
- Financial projections (2 scenarios)
|
||||
- Why now analysis
|
||||
- Recommendation
|
||||
- Appendix with detailed feature priorities
|
||||
|
||||
**Next Document:** UK_MARKET_STRATEGY.md (for GTM details)
|
||||
|
||||
---
|
||||
|
||||
### 3. **UK_FEATURE_PRIORITIZATION.md** (20-30 minutes)
|
||||
**Size:** 25-30 pages
|
||||
**Format:** Detailed technical analysis
|
||||
**Best For:** Product Managers, Engineering Leads
|
||||
**Contains:**
|
||||
- Executive summary
|
||||
- Market context (fraud patterns & statistics)
|
||||
- Available UK data sources (detailed analysis of 8 APIs)
|
||||
- Ranked feature prioritization (matrix format)
|
||||
- Recommended implementation roadmap (3 phases)
|
||||
- Feature implementation examples (code pseudocode)
|
||||
- Success metrics per feature
|
||||
- Risk mitigation strategies
|
||||
- UK market positioning statement
|
||||
- API accessibility summary table
|
||||
- Next steps (this week actions)
|
||||
|
||||
**Key Section:** "Ranked Feature Prioritization" (clear action priorities)
|
||||
|
||||
---
|
||||
|
||||
### 4. **PHASE1_TECHNICAL_IMPLEMENTATION.md** (40-50 minutes)
|
||||
**Size:** 50-60 pages
|
||||
**Format:** Complete technical specification + code
|
||||
**Best For:** Backend Engineers, QA Engineers
|
||||
**Contains:**
|
||||
- Phase 1 overview (8-week timeline)
|
||||
- Feature 1: HEDD Integration (complete implementation)
|
||||
- Architecture diagram
|
||||
- 5 complete C# files (interfaces, services, models)
|
||||
- Configuration examples
|
||||
- Database considerations
|
||||
- Feature 2: Enhanced Timeline Analysis (code example)
|
||||
- Feature 3: Companies House Director Verification (code example)
|
||||
- Feature 4: Healthcare Register Scrapers (code example)
|
||||
- Dependency injection setup
|
||||
- Integration examples
|
||||
- Testing strategy
|
||||
- Configuration checklist
|
||||
- Database migration guide
|
||||
- Validation checklist
|
||||
|
||||
**Most Valuable:** "Phase 1a-1g" sections with production-ready code
|
||||
|
||||
---
|
||||
|
||||
### 5. **UK_MARKET_STRATEGY.md** (30-40 minutes)
|
||||
**Size:** 40-50 pages
|
||||
**Format:** Comprehensive market strategy document
|
||||
**Best For:** Product Team, Marketing, Sales, Leadership
|
||||
**Contains:**
|
||||
- Market opportunity analysis
|
||||
- Problem statement (detailed)
|
||||
- Market sizing (TAM/SAM/SOM)
|
||||
- Competitive landscape (8 competitors analyzed)
|
||||
- Product strategy (3 phases)
|
||||
- Go-to-market strategy (4 sales channels)
|
||||
- Pricing strategy (tier analysis + unit economics)
|
||||
- Organizational requirements (team structure over 12 months)
|
||||
- Key risks & mitigations
|
||||
- 12-month success metrics
|
||||
- Financial projections (conservative + growth scenarios)
|
||||
- Next 30 days action plan
|
||||
- Long-term vision (2-3 years, international expansion)
|
||||
- Customer personas (3 detailed profiles)
|
||||
- References & data sources
|
||||
|
||||
**Most Valuable:** Financials section + Customer personas
|
||||
|
||||
---
|
||||
|
||||
### 6. **API_RESOURCES_AND_CONTACTS.md** (20-30 minutes)
|
||||
**Size:** 20-25 pages
|
||||
**Format:** Practical implementation guide
|
||||
**Best For:** Engineering + Product (implementation phase)
|
||||
**Contains:**
|
||||
- Detailed guide for 11 UK APIs
|
||||
- HEDD (degree verification)
|
||||
- GMC Register (doctors)
|
||||
- NMC Register (nurses)
|
||||
- Companies House (already integrated)
|
||||
- GOV.UK Regulated Professions
|
||||
- ICAEW (accountants)
|
||||
- SRA (lawyers)
|
||||
- IET (engineers)
|
||||
- HCPC (health professionals)
|
||||
- DBS Integration (partnership model)
|
||||
- HMRC Payroll (restricted access)
|
||||
- For each API:
|
||||
- Overview & coverage
|
||||
- Access information
|
||||
- Contact details
|
||||
- Integration methods (API vs. scraper)
|
||||
- Required registration info
|
||||
- Timeline for access
|
||||
- Documentation links
|
||||
- Implementation prioritization table
|
||||
- Compliance & data protection checklist
|
||||
- Email template for API requests
|
||||
- Contact information for vendors
|
||||
|
||||
**Most Valuable:** Everything you need to know to obtain API access
|
||||
|
||||
---
|
||||
|
||||
### 7. **README_UK_STRATEGY.md** (5-10 minutes)
|
||||
**Size:** 8-10 pages
|
||||
**Format:** Navigation guide + executive summary
|
||||
**Best For:** Navigation & orientation for all audiences
|
||||
**Contains:**
|
||||
- Document hierarchy
|
||||
- Quick navigation by role
|
||||
- Key metrics at a glance
|
||||
- Fraud detection coverage
|
||||
- Competitive moat explanation
|
||||
- Critical path dependencies
|
||||
- Financial summary
|
||||
- Risk mitigation
|
||||
- 30-day plan (high-level)
|
||||
- Recommended reading order
|
||||
- Questions & decision points
|
||||
- Success criteria
|
||||
- File manifest
|
||||
- Version history
|
||||
- Key definitions & terminology
|
||||
- License & confidentiality notice
|
||||
|
||||
**Most Valuable:** Orientation + role-based reading paths
|
||||
|
||||
---
|
||||
|
||||
## Role-Based Reading Guide
|
||||
|
||||
### For Executives (20-30 minutes total)
|
||||
1. **QUICK_REFERENCE.md** (5 min) - Print & keep at desk
|
||||
2. **EXECUTIVE_SUMMARY.md** (10 min) - Full read
|
||||
3. **UK_MARKET_STRATEGY.md** (10 min) - Market Opportunity + Financials sections only
|
||||
4. **Decision:** Approve Phase 1 go-ahead?
|
||||
|
||||
---
|
||||
|
||||
### For Product Managers (90 minutes total)
|
||||
1. **QUICK_REFERENCE.md** (5 min) - Orientation
|
||||
2. **EXECUTIVE_SUMMARY.md** (10 min) - Full read
|
||||
3. **UK_FEATURE_PRIORITIZATION.md** (35 min) - Full read (PRIORITY)
|
||||
4. **UK_MARKET_STRATEGY.md** (25 min) - GTM + Personas sections
|
||||
5. **API_RESOURCES_AND_CONTACTS.md** (10 min) - Skim for reference
|
||||
6. **PHASE1_TECHNICAL_IMPLEMENTATION.md** (5 min) - Skim architecture section only
|
||||
|
||||
---
|
||||
|
||||
### For Backend Engineers (2 hours total)
|
||||
1. **QUICK_REFERENCE.md** (5 min) - Context
|
||||
2. **EXECUTIVE_SUMMARY.md** (5 min) - Skim only
|
||||
3. **PHASE1_TECHNICAL_IMPLEMENTATION.md** (70 min) - FULL READ + study code
|
||||
4. **API_RESOURCES_AND_CONTACTS.md** (30 min) - FULL READ + bookmark sections
|
||||
5. **UK_FEATURE_PRIORITIZATION.md** (10 min) - Implementation examples section
|
||||
|
||||
---
|
||||
|
||||
### For QA Engineers (60 minutes total)
|
||||
1. **QUICK_REFERENCE.md** (5 min)
|
||||
2. **EXECUTIVE_SUMMARY.md** (5 min)
|
||||
3. **UK_FEATURE_PRIORITIZATION.md** (20 min) - Success metrics section
|
||||
4. **PHASE1_TECHNICAL_IMPLEMENTATION.md** (30 min) - Testing & validation sections
|
||||
|
||||
---
|
||||
|
||||
### For Sales/Marketing (55 minutes total)
|
||||
1. **QUICK_REFERENCE.md** (5 min) - Print one
|
||||
2. **EXECUTIVE_SUMMARY.md** (10 min)
|
||||
3. **UK_MARKET_STRATEGY.md** (35 min) - GTM Strategy + Customer Personas + Messaging
|
||||
4. **API_RESOURCES_AND_CONTACTS.md** (5 min) - Quick skim
|
||||
|
||||
---
|
||||
|
||||
### For Investors/Analysts (45 minutes total)
|
||||
1. **EXECUTIVE_SUMMARY.md** (10 min) - FULL READ
|
||||
2. **UK_MARKET_STRATEGY.md** (30 min) - Market Opportunity, Financials, Competitive Landscape sections
|
||||
3. **QUICK_REFERENCE.md** (5 min) - Risk dashboard
|
||||
|
||||
---
|
||||
|
||||
## Document Cross-References
|
||||
|
||||
### How to Find Information About...
|
||||
|
||||
**HEDD Integration:**
|
||||
- Quick overview → QUICK_REFERENCE.md (API Integration Status table)
|
||||
- Strategic importance → EXECUTIVE_SUMMARY.md
|
||||
- Detailed analysis → UK_FEATURE_PRIORITIZATION.md (Section: "HEDD Degree Verification")
|
||||
- Technical implementation → PHASE1_TECHNICAL_IMPLEMENTATION.md (Feature 1)
|
||||
- How to get access → API_RESOURCES_AND_CONTACTS.md (Section 1)
|
||||
|
||||
**Market Opportunity:**
|
||||
- Quick version → QUICK_REFERENCE.md (Market Opportunity section)
|
||||
- Detailed analysis → EXECUTIVE_SUMMARY.md (full document)
|
||||
- Go-to-market strategy → UK_MARKET_STRATEGY.md (full document)
|
||||
- Customer research → UK_MARKET_STRATEGY.md (Customer Personas)
|
||||
|
||||
**Financial Projections:**
|
||||
- Quick reference → QUICK_REFERENCE.md (Financial Projections)
|
||||
- Conservative scenario → EXECUTIVE_SUMMARY.md
|
||||
- Detailed projections → UK_MARKET_STRATEGY.md (Financial Projections section)
|
||||
- Unit economics → UK_MARKET_STRATEGY.md (Pricing Strategy)
|
||||
|
||||
**Timeline & Roadmap:**
|
||||
- Quick version → QUICK_REFERENCE.md (Phase 1 Roadmap)
|
||||
- Executive summary → EXECUTIVE_SUMMARY.md (Implementation Plan)
|
||||
- Detailed roadmap → UK_MARKET_STRATEGY.md (3-phase strategy)
|
||||
- Technical details → PHASE1_TECHNICAL_IMPLEMENTATION.md (entire document)
|
||||
|
||||
**Competitive Advantage:**
|
||||
- Matrix format → QUICK_REFERENCE.md (Competitive Advantage)
|
||||
- Analysis → EXECUTIVE_SUMMARY.md (Why Now section)
|
||||
- Detailed analysis → UK_MARKET_STRATEGY.md (Competitive Landscape)
|
||||
- Moat explanation → README_UK_STRATEGY.md
|
||||
|
||||
**Team & Resources:**
|
||||
- Summary → QUICK_REFERENCE.md (Team Requirements)
|
||||
- Detailed breakdown → UK_MARKET_STRATEGY.md (Organizational Requirements)
|
||||
- Implementation details → PHASE1_TECHNICAL_IMPLEMENTATION.md
|
||||
|
||||
**Risk Management:**
|
||||
- Dashboard → QUICK_REFERENCE.md (Risk Dashboard)
|
||||
- Brief mitigation → EXECUTIVE_SUMMARY.md (Key Dependencies & Risks)
|
||||
- Detailed analysis → UK_FEATURE_PRIORITIZATION.md (Risk Mitigation)
|
||||
- Market risks → UK_MARKET_STRATEGY.md (Key Risks & Mitigations)
|
||||
|
||||
**API Information:**
|
||||
- Status table → QUICK_REFERENCE.md (API Integration Status)
|
||||
- Accessibility overview → UK_FEATURE_PRIORITIZATION.md (API Accessibility Summary)
|
||||
- Detailed guides → API_RESOURCES_AND_CONTACTS.md (entire document)
|
||||
|
||||
---
|
||||
|
||||
## Information Density by Document
|
||||
|
||||
| Document | Pages | Detail Level | Best For |
|
||||
|---|---|---|---|
|
||||
| QUICK_REFERENCE.md | 3-4 | High density, visual | Desk reference |
|
||||
| EXECUTIVE_SUMMARY.md | 5-6 | Medium density | Decision-making |
|
||||
| UK_FEATURE_PRIORITIZATION.md | 25-30 | High detail | Strategy execution |
|
||||
| PHASE1_TECHNICAL_IMPLEMENTATION.md | 50-60 | Very high detail | Engineering |
|
||||
| UK_MARKET_STRATEGY.md | 40-50 | High detail | Business strategy |
|
||||
| API_RESOURCES_AND_CONTACTS.md | 20-25 | Reference style | API integration |
|
||||
| README_UK_STRATEGY.md | 8-10 | Navigation focus | Finding information |
|
||||
|
||||
---
|
||||
|
||||
## Key Metrics Summary
|
||||
|
||||
All documents contain these key metrics:
|
||||
|
||||
**Market Opportunity:**
|
||||
- TAM: £3.3M (UK recruitment market)
|
||||
- Year 1 Revenue Target: £30-240K
|
||||
- Break-even: 24-30 customers
|
||||
- Profitability: Month 6-7
|
||||
|
||||
**Fraud Coverage:**
|
||||
- HEDD: 90%+ detection of fake degrees
|
||||
- Timeline: 80%+ detection of employment date fraud
|
||||
- Healthcare: 95%+ detection of GMC/NMC fraud
|
||||
|
||||
**Success Metrics:**
|
||||
- Signups: 500+ in first month
|
||||
- Active rate: 10%+ weekly
|
||||
- Feature satisfaction: 85%+
|
||||
- Uptime: 99.9%
|
||||
|
||||
**Financial Unit Economics:**
|
||||
- CAC: £150-300
|
||||
- ARPU: £60-120/month
|
||||
- Payback: 2-4 months
|
||||
- Gross margin: 75-80%
|
||||
|
||||
---
|
||||
|
||||
## Action Items Checklist
|
||||
|
||||
After reading these documents, complete:
|
||||
|
||||
### Week 1 (Critical Path)
|
||||
- [ ] Read EXECUTIVE_SUMMARY.md + QUICK_REFERENCE.md
|
||||
- [ ] Decide: Proceed with Phase 1?
|
||||
- [ ] If YES: Send API access requests (HEDD, GMC, NMC)
|
||||
- [ ] If YES: Allocate 2 engineers to Phase 1
|
||||
- [ ] If YES: Identify 3-5 beta partner recruitment agencies
|
||||
|
||||
### Week 2-3
|
||||
- [ ] Read PHASE1_TECHNICAL_IMPLEMENTATION.md (if engineering)
|
||||
- [ ] Read UK_FEATURE_PRIORITIZATION.md (if product)
|
||||
- [ ] Receive API access credentials or begin scraper development
|
||||
- [ ] Set up development environment
|
||||
- [ ] Begin Phase 1 coding
|
||||
|
||||
### Week 4-8
|
||||
- [ ] Execute Phase 1 development plan
|
||||
- [ ] Deploy beta environment
|
||||
- [ ] Conduct user testing with beta partners
|
||||
- [ ] Iterate based on feedback
|
||||
- [ ] Plan public launch
|
||||
|
||||
---
|
||||
|
||||
## Version Control & Updates
|
||||
|
||||
**Current Version:** 1.0 - January 20, 2026
|
||||
|
||||
**Planned Updates:**
|
||||
- **April 2026:** Post-Phase 1 launch review
|
||||
- **July 2026:** Post-Phase 2 launch update (Professional Bodies)
|
||||
- **October 2026:** Post-Phase 3 launch update (Compliance/Regulatory)
|
||||
- **January 2027:** Year 1 retrospective + Year 2 planning
|
||||
|
||||
**Update Process:**
|
||||
1. Incorporate market feedback from beta/paying customers
|
||||
2. Update financial projections with actual metrics
|
||||
3. Revise timeline based on actual delivery vs. plan
|
||||
4. Add new competitive intelligence
|
||||
5. Update feature roadmap based on customer demand
|
||||
|
||||
---
|
||||
|
||||
## Document Quality Standards
|
||||
|
||||
Each document has been:
|
||||
- ✅ Reviewed for accuracy (market data, API info current as of Jan 2026)
|
||||
- ✅ Checked for internal consistency (numbers align across docs)
|
||||
- ✅ Tested for completeness (all major topics covered)
|
||||
- ✅ Formatted for easy navigation (clear sections, tables, links)
|
||||
- ✅ Validated for actionability (contains concrete next steps)
|
||||
|
||||
---
|
||||
|
||||
## Copyright & Distribution
|
||||
|
||||
**Ownership:** TrueCV Product Team
|
||||
**Classification:** Internal Only
|
||||
**Distribution:** Leadership, Product, Engineering only
|
||||
|
||||
**Permitted Use:**
|
||||
- Internal strategic planning ✅
|
||||
- Cross-functional alignment meetings ✅
|
||||
- Board presentations ✅
|
||||
- Investor pitches ✅
|
||||
|
||||
**Prohibited Use:**
|
||||
- Public distribution ❌
|
||||
- Sharing with competitors ❌
|
||||
- Press releases without approval ❌
|
||||
- Posting on public repositories ❌
|
||||
|
||||
---
|
||||
|
||||
## Support & Questions
|
||||
|
||||
**For questions about this strategy:**
|
||||
|
||||
- **Strategy Overview:** Product Manager
|
||||
- **Market Analysis:** Marketing Lead
|
||||
- **Technical Implementation:** Engineering Lead
|
||||
- **Financial Model:** CFO/Finance
|
||||
- **Customer Personas:** Sales Lead
|
||||
- **API Integration:** Technical Lead
|
||||
|
||||
**Document Feedback:**
|
||||
- Report errors: [Internal feedback channel]
|
||||
- Suggest additions: [Internal feedback channel]
|
||||
- Request updates: [Internal feedback channel]
|
||||
|
||||
---
|
||||
|
||||
## Appendix: Quick Stats
|
||||
|
||||
```
|
||||
MARKET OPPORTUNITY
|
||||
UK CV fraud cost: £4.2B annually
|
||||
Addressable market: £3.3M (TrueCV's portion)
|
||||
Candidates lying: 1 in 5 (20%)
|
||||
Failed verifications: 24% of CVs
|
||||
Current verification time: 5-10 DAYS
|
||||
|
||||
COMPETITIVE ADVANTAGE
|
||||
Features only TrueCV offers: 4 major features
|
||||
Market gap size: Unexploited (£3.3M)
|
||||
Time to market advantage: 6-12 months
|
||||
|
||||
PHASE 1 DELIVERY
|
||||
Timeline: 8 weeks (Q1 2026)
|
||||
Features: 4 major features
|
||||
Team: 2 engineers + 1 QA
|
||||
APIs integrated: 5 new integrations
|
||||
Testing: >90% code coverage
|
||||
|
||||
YEAR 1 TARGETS
|
||||
Revenue (conservative): £113K (50 customers)
|
||||
Revenue (growth): £227K (100 customers)
|
||||
Break-even: 24-30 customers (Month 6-7)
|
||||
Profitability: Month 8-9 (if growth scenario)
|
||||
|
||||
SUCCESS METRICS
|
||||
Signups month 1: 500+
|
||||
Weekly active rate: 10%+
|
||||
Feature satisfaction: 85%+
|
||||
Uptime: 99.9%
|
||||
|
||||
TEAM REQUIREMENTS
|
||||
Phase 1 (Q1): 2 engineers + 1 QA + 1 PM + 1 marketing
|
||||
Phase 2 (Q2): +1 engineer + 1 sales/BD
|
||||
Phase 3 (Q3): +1 customer success + 1 analyst
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
**Last Updated:** January 20, 2026
|
||||
**Next Review:** April 1, 2026
|
||||
**Status:** READY FOR EXECUTION
|
||||
|
||||
---
|
||||
|
||||
## Quick Links
|
||||
|
||||
**Files Created:**
|
||||
- `QUICK_REFERENCE.md`
|
||||
- `EXECUTIVE_SUMMARY.md`
|
||||
- `UK_FEATURE_PRIORITIZATION.md`
|
||||
- `PHASE1_TECHNICAL_IMPLEMENTATION.md`
|
||||
- `UK_MARKET_STRATEGY.md`
|
||||
- `API_RESOURCES_AND_CONTACTS.md`
|
||||
- `README_UK_STRATEGY.md`
|
||||
- `INDEX.md` (this file)
|
||||
|
||||
**Total:** 8 files: 7 strategy documents plus this index (~200 pages)
|
||||
|
||||
@@ -1,380 +0,0 @@
|
||||
# TrueCV UK Strategy - Quick Reference Card
|
||||
|
||||
**Print this page for desk reference during planning & execution**
|
||||
|
||||
---
|
||||
|
||||
## Market Opportunity (The Why)
|
||||
|
||||
```
|
||||
UK CV Fraud Cost: £4.2B annually
|
||||
Candidates Lying: 1 in 5 (20%)
|
||||
Failed Verifications: 24% of CVs
|
||||
Current Verification Time: 5-10 DAYS
|
||||
TrueCV Solution Time: 5 SECONDS ⚡
|
||||
|
||||
Market Addressable: £3.3M (UK)
|
||||
Year 1 Target Revenue: £30-240K
|
||||
Break-even Customers: 24-30
|
||||
Expected Profitability: Month 6-7
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
## Competitive Advantage (Why Now)
|
||||
|
||||
```
|
||||
FEATURE TrueCV Workable Deel Checkr
|
||||
─────────────────────────────────────────────────────────
|
||||
HEDD Degree Verification ✅ ❌ ❌ ❌
|
||||
GMC/NMC Healthcare ✅ ❌ ❌ ❌
|
||||
Timeline Fraud Detection ✅ ❌ ❌ ❌
|
||||
Director Verification ✅ ❌ ❌ ❌
|
||||
Companies House API ✅ ❌ ❌ ❌
|
||||
|
||||
CONCLUSION: Only player with integrated UK CV verification
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
## Phase 1 Roadmap (Q1 2026 - 8 Weeks)
|
||||
|
||||
```
|
||||
Week 1-2: SETUP
|
||||
├─ Secure API access (HEDD, GMC, NMC)
|
||||
├─ Allocate 2 engineers
|
||||
└─ Recruit 3-5 beta partners
|
||||
|
||||
Week 2-4: DEVELOPMENT (Parallel Tracks)
|
||||
├─ HEDD integration (Lead eng: 2-3 weeks)
|
||||
├─ Healthcare registers (Sec eng: 1 week)
|
||||
├─ Companies House enhancement (Sec eng: 1-2 weeks)
|
||||
└─ Timeline analysis (Tertiary: 1 week)
|
||||
|
||||
Week 5-7: BETA TESTING
|
||||
├─ Deploy to test environment
|
||||
├─ Onboard beta agencies
|
||||
├─ Collect feedback
|
||||
└─ Iterate on UX/flags
|
||||
|
||||
Week 8: PUBLIC LAUNCH
|
||||
├─ GA release
|
||||
├─ Marketing campaign
|
||||
├─ Press/analyst outreach
|
||||
└─ Sales outreach begins
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
## Features Ranked by Impact × Feasibility
|
||||
|
||||
```
|
||||
HIGH IMPACT + EASY ─────────────┬─ HIGH IMPACT + HARD
|
||||
│
|
||||
1. HEDD Verification (9.5/10) │ 8. DBS Integration (Q3)
|
||||
2. Timeline Analysis (7/10) │ 5. HMRC Payroll (Q3)
|
||||
3. GMC/NMC Checks (6.5/10) │ 6. Professional Bodies
|
||||
4. Director Verify (7.5/10) │
|
||||
│
|
||||
MEDIUM IMPACT + EASY ───────────┼─ MEDIUM IMPACT + HARD
|
||||
│
|
||||
7. GOV.UK Registry (5/10) │
|
||||
│
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
## API Integration Status
|
||||
|
||||
| Service | Type | Access | Effort | Timeline |
|
||||
|---|---|---|---|---|
|
||||
| **HEDD** | API/Portal | REQUEST | 3 wks | Weeks 1-3 |
|
||||
| **GMC** | API/Scraper | REQUEST | 1 wk | Weeks 2-3 |
|
||||
| **NMC** | API/Scraper | REQUEST | 1 wk | Weeks 2-3 |
|
||||
| **Companies House** | ✅ API | READY | 2 wks | Weeks 2-4 |
|
||||
| **GOV.UK** | ✅ API | PUBLIC | 3 days | Week 2 |
|
||||
| **ICAEW** | API/Scraper | REQUEST | 2-3 wks | Q2 |
|
||||
| **SRA** | API/Scraper | REQUEST | 2-3 wks | Q2 |
|
||||
| **DBS** | Partner API | VENDOR | 8 wks | Q3 |
|
||||
|
||||
---
|
||||
|
||||
## Pricing Strategy
|
||||
|
||||
```
|
||||
TIER PRICE/MO CUSTOMERS MRR CONTRIB
|
||||
─────────────────────────────────────────────────────
|
||||
Free £0 30% £0
|
||||
Professional £49/mo 40% 1,470 (30 cust)
|
||||
Enterprise £199/mo 20% 2,985 (15 cust)
|
||||
API/Platform £1,000/mo 5% 5,000 (5 cust)
|
||||
|
||||
TOTAL MRR TARGET: £9,455 (50 customers)
|
||||
ANNUALIZED: £113K
|
||||
|
||||
Break-even MRR: £1,833 (24 customers)
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
## Success Metrics - Phase 1
|
||||
|
||||
| Metric | Target | Owner | Measurement |
|
||||
|---|---|---|---|
|
||||
| Signups | 500+ month 1 | Growth | User registrations |
|
||||
| Active Rate | 10%+ weekly | Product | Weekly check rate |
|
||||
| HEDD Accuracy | >98% | QA | Match rate vs. actual |
|
||||
| Timeline Detection | 85%+ | QA | Gaps/overlaps caught |
|
||||
| Feature Satisfaction | 85%+ | Support | NPS feedback |
|
||||
| Infrastructure Uptime | 99.9% | DevOps | Monitoring alerts |
|
||||
|
||||
---
|
||||
|
||||
## Fraud Detection Coverage
|
||||
|
||||
```
|
||||
FRAUD TYPE DETECTION RATE PHASE
|
||||
───────────────────────────────────────────────────
|
||||
Fake Degrees 90%+ Phase 1 ⭐
|
||||
Job Title Inflation Partial Phase 1
|
||||
Employment Date Lies 80%+ Phase 1 ⭐
|
||||
Directorship False Claims 95%+ Phase 1 ⭐
|
||||
Professional Cert Fraud 95%+ Phase 2
|
||||
Timeline Gaps/Overlaps 85%+ Phase 1 ⭐
|
||||
Medical Register Fraud 95%+ Phase 1 ⭐
|
||||
|
||||
PHASE 1 COVERAGE: ~80% of common fraud patterns
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
## Financial Projections
|
||||
|
||||
### Year 1 (Conservative)
|
||||
```
|
||||
Customers: 50
|
||||
MRR: £9,455
|
||||
Annual Revenue: £113,460
|
||||
Gross Margin: 75% (£85K)
|
||||
Operating Costs: £220K
|
||||
Result: BREAK-EVEN
|
||||
```
|
||||
|
||||
### Year 1 (Growth)
|
||||
```
|
||||
Customers: 100
|
||||
MRR: £18,910
|
||||
Annual Revenue: £226,920
|
||||
Gross Margin: 75% (£170K)
|
||||
Operating Costs: £220K
|
||||
Result: PROFITABLE (+£20K margin)
|
||||
```
|
||||
|
||||
### CAC Payback
|
||||
```
|
||||
Customer Acquisition Cost: £150-300
|
||||
Average Revenue Per User: £60-120/mo
|
||||
Payback Period: 2-4 MONTHS (healthy)
|
||||
LTV:CAC Ratio: 4:1+ (excellent)
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
## 30-Day Action Plan
|
||||
|
||||
### NOW (This Week)
|
||||
```
|
||||
Priority 1: Email HEDD (partnerships@hedd.ac.uk)
|
||||
↳ Request API access or partnership discussion
|
||||
↳ Mention CV verification for UK recruiters
|
||||
↳ Expect response: 5-10 business days
|
||||
|
||||
Priority 2: Email GMC (digital@gmc-uk.org)
|
||||
↳ Same request structure
|
||||
↳ Fallback: scraper development if denied
|
||||
|
||||
Priority 3: Allocate Engineering Resources
|
||||
↳ 2 FTE engineers full-time for 8 weeks
|
||||
↳ 1 QA engineer (weeks 2-3)
|
||||
↳ 1 PM for coordination
|
||||
|
||||
Priority 4: Recruit Beta Partners
|
||||
↳ Target 3-5 recruitment agencies
|
||||
↳ Offer free access in exchange for feedback
|
||||
↳ Aim: 5+ interviews by end of week 2
|
||||
```
|
||||
|
||||
### WEEK 2-3 (Development Starts)
|
||||
```
|
||||
✅ HEDD credentials received (or scraper ready)
|
||||
✅ Development environment configured
|
||||
✅ Companies House enhancement code started
|
||||
✅ Timeline analysis enhancements begun
|
||||
✅ Healthcare register scrapers drafted
|
||||
```
|
||||
|
||||
### WEEK 4-8 (Beta & Launch)
|
||||
```
|
||||
✅ Features completed & tested
|
||||
✅ Beta deployment & testing
|
||||
✅ Public launch announcement
|
||||
✅ First 100 signups targeted
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
## Team Requirements
|
||||
|
||||
### Phase 1 (Q1)
|
||||
```
|
||||
Backend Engineer (Lead): Full-time (8 weeks) - HEDD integration
|
||||
Backend Engineer (Secondary): Full-time (8 weeks) - Healthcare + Timeline
|
||||
QA Engineer: Part-time (weeks 2-3)
|
||||
Product Manager: Full-time (coordination)
|
||||
Marketing Lead: Part-time (50%) - Content & outreach
|
||||
```
|
||||
|
||||
### Phase 2 Addition (Q2)
|
||||
```
|
||||
+ Full-Stack Engineer (vertical expansion)
|
||||
+ Sales/BD Lead (partnership development)
|
||||
```
|
||||
|
||||
### Phase 3 Addition (Q3)
|
||||
```
|
||||
+ Customer Success Manager
|
||||
+ Data Analyst (metrics/LTV)
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
## Risk Dashboard
|
||||
|
||||
```
|
||||
RISK PROB SEVERITY MITIGATION
|
||||
──────────────────────────────────────────────────────────
|
||||
HEDD API Access Delayed 🟡 🟡 Scraper fallback
|
||||
GMC Blocks Scraping 🟢 🟡 Request official API
|
||||
Market Adoption Slow 🟡 🔴 Focus healthcare 1st
|
||||
Regulatory Gatekeeping 🟢 🟡 Partner early
|
||||
Competitor Response 🟡 🟡 First-mover advantage
|
||||
|
||||
🟢 LOW (20%) 🟡 MEDIUM (50%) 🔴 HIGH (80%)
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
## Customer Personas
|
||||
|
||||
### Persona 1: Agency Owner (Mid-Market)
|
||||
```
|
||||
Name: Sarah, 48 years old
|
||||
Company: Recruitment agency (80 staff)
|
||||
Problem: Wasting 2-3 hrs/hire verifying degrees
|
||||
Budget: £3K-8K/year on screening
|
||||
Buying Signal: "Can you reduce verification from 5 days to 5 min?"
|
||||
Target Tier: PROFESSIONAL (£49/mo)
|
||||
```
|
||||
|
||||
### Persona 2: Corporate HR Manager
|
||||
```
|
||||
Name: James, 35 years old
|
||||
Company: Financial services (200 employees)
|
||||
Problem: Regulatory liability + reputational risk
|
||||
Budget: £20K-50K/year on compliance
|
||||
Buying Signal: "We need proof every hire is verified"
|
||||
Target Tier: ENTERPRISE (£199/mo)
|
||||
```
|
||||
|
||||
### Persona 3: Healthcare Recruiter
|
||||
```
|
||||
Name: Dr. Lisa, 42 years old
|
||||
Company: Healthcare recruiter (20 staff)
|
||||
Problem: Need instant GMC/NMC verification
|
||||
Budget: £2K-5K/year (cost-sensitive)
|
||||
Buying Signal: "If you verify healthcare pros instantly, we're in"
|
||||
Target Tier: PROFESSIONAL (£49/mo)
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
## Sales Channels
|
||||
|
||||
```
|
||||
1. DIRECT SALES (Primary)
|
||||
└─ Target agency owners + HR directors
|
||||
└─ LinkedIn outreach + cold calls
|
||||
└─ Expected conversion: 5-8%
|
||||
└─ Sales cycle: 2-4 weeks
|
||||
|
||||
2. PARTNERSHIPS (Secondary)
|
||||
└─ ATS integrations (Workable, Bullhorn, Lever)
|
||||
└─ White-label for background check providers
|
||||
└─ Marketplace listings (Zapier, Make)
|
||||
└─ Expected impact: +30% acquisition
|
||||
|
||||
3. CONTENT & SEO (Tertiary)
|
||||
└─ Blog posts: "UK CV Fraud Patterns"
|
||||
└─ Case studies: "How we caught 18 fake degrees"
|
||||
└─ Webinars for HR professionals
|
||||
└─ Expected impact: +20% organic
|
||||
|
||||
4. VERTICAL SPECIALISTS (Niche)
|
||||
└─ Healthcare recruiting (GMC/NMC entry)
|
||||
└─ Financial services (ICAEW/compliance)
|
||||
└─ Legal recruiting (SRA verification)
|
||||
└─ Expected impact: +25% high-value
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
## Decision Framework
|
||||
|
||||
### Go-Ahead Criteria
|
||||
- ✅ 2 engineers available full-time for 8 weeks
|
||||
- ✅ HEDD partnership or web portal access confirmed
|
||||
- ✅ 3+ beta partner recruitment agencies identified
|
||||
- ✅ Budget approved for Phase 1 (£40-50K estimated)
|
||||
- ✅ Product & GTM strategy aligned with leadership
|
||||
|
||||
### Red Flags (Stop & Reassess)
|
||||
- ❌ HEDD access denied AND scraper approach infeasible
|
||||
- ❌ Fewer than 3 beta partners willing to participate
|
||||
- ❌ Engineering capacity not available
|
||||
- ❌ Market research shows insufficient demand
|
||||
- ❌ Competitive threat emerges
|
||||
|
||||
---
|
||||
|
||||
## Key Contacts
|
||||
|
||||
| Role | Contact | Email | Notes |
|
||||
|---|---|---|---|
|
||||
| **HEDD Partnership** | Prospects Ltd | partnerships@hedd.ac.uk | START HERE |
|
||||
| **GMC Verification** | GMC Digital Team | digital@gmc-uk.org | Request API access |
|
||||
| **NMC Verification** | NMC Tech Team | [Check website] | Parallel request |
|
||||
| **Companies House** | Already have API | [API Docs available] | No action needed |
|
||||
| **DBS Vendors** | Verifile / DDC | [See API guide] | Q3 partnership |
|
||||
|
||||
---
|
||||
|
||||
## Next Document to Read
|
||||
|
||||
Based on your role:
|
||||
- **Executive:** Read UK_MARKET_STRATEGY.md → Market Opportunity section
|
||||
- **Product:** Read UK_FEATURE_PRIORITIZATION.md (full)
|
||||
- **Engineering:** Read PHASE1_TECHNICAL_IMPLEMENTATION.md (full)
|
||||
- **Everyone:** Read README_UK_STRATEGY.md for navigation
|
||||
|
||||
---
|
||||
|
||||
## One-Liner Summary
|
||||
|
||||
> **TrueCV is the only UK CV verification tool that catches 90% of fake degrees + employment fraud in seconds, leveraging HEDD, GMC/NMC, and Companies House APIs to dominate a £3.3M untapped recruitment market.**
|
||||
|
||||
---
|
||||
|
||||
**Last Updated:** January 20, 2026
|
||||
**Status:** Ready for Q1 2026 Execution
|
||||
**Next Review:** Post-Phase 1 Launch (Week 8)
|
||||
|
||||
@@ -1,419 +0,0 @@
|
||||
# TrueCV UK Market Strategy - Complete Package
|
||||
|
||||
## Overview
|
||||
|
||||
This directory contains the complete product strategy and implementation plan for launching TrueCV with a UK-only focus. The documents provide market analysis, feature prioritization, technical implementation details, and go-to-market strategy.
|
||||
|
||||
---
|
||||
|
||||
## Document Hierarchy
|
||||
|
||||
### 1. **EXECUTIVE_SUMMARY.md** ⭐ START HERE
|
||||
**Audience:** Executives, Product Leadership, Investors
|
||||
**Purpose:** 5-minute overview of opportunity, market sizing, and financial projections
|
||||
**Key Sections:**
|
||||
- Market problem (£4.2B annual cost)
|
||||
- Competitive advantage (only player integrating HEDD)
|
||||
- Revenue projections (£113K-226K Year 1)
|
||||
- 30-day action plan
|
||||
|
||||
**Read Time:** 5 minutes
|
||||
|
||||
---
|
||||
|
||||
### 2. **UK_FEATURE_PRIORITIZATION.md**
|
||||
**Audience:** Product Managers, Engineering Leads
|
||||
**Purpose:** Detailed feature prioritization ranking detection value × implementation feasibility
|
||||
**Key Sections:**
|
||||
- Fraud patterns & detection rates
|
||||
- Available UK APIs & accessibility
|
||||
- Ranked feature list (8 features across 3 phases)
|
||||
- Implementation timeline & examples
|
||||
- Success metrics per feature
|
||||
|
||||
**Read Time:** 20-30 minutes
|
||||
|
||||
---
|
||||
|
||||
### 3. **PHASE1_TECHNICAL_IMPLEMENTATION.md**
|
||||
**Audience:** Backend Engineers, QA Engineers
|
||||
**Purpose:** Complete technical specifications for Phase 1 (8-week) delivery
|
||||
**Key Sections:**
|
||||
- Architecture diagrams
|
||||
- 7 complete code examples (interfaces, services, models)
|
||||
- Database schema updates
|
||||
- Test coverage requirements
|
||||
- Configuration & environment setup
|
||||
- Deployment checklist
|
||||
|
||||
**Read Time:** 30-40 minutes (skim for reference)
|
||||
|
||||
---
|
||||
|
||||
### 4. **UK_MARKET_STRATEGY.md**
|
||||
**Audience:** Product Team, Marketing, Sales
|
||||
**Purpose:** Comprehensive market analysis and go-to-market strategy
|
||||
**Key Sections:**
|
||||
- Market sizing (£2.8B UK screening market, £3.3M TrueCV TAM)
|
||||
- Competitive landscape analysis
|
||||
- 3-phase product roadmap (Q1-Q3 2026)
|
||||
- GTM strategy (4 sales channels)
|
||||
- Customer personas (3 types)
|
||||
- Unit economics & financial projections
|
||||
- Long-term vision (2-3 years, international expansion)
|
||||
|
||||
**Read Time:** 30-40 minutes
|
||||
|
||||
---
|
||||
|
||||
### 5. **API_RESOURCES_AND_CONTACTS.md**
|
||||
**Audience:** Engineering + Product (implementation phase)
|
||||
**Purpose:** Practical guide to accessing UK APIs and vendor partnerships
|
||||
**Key Sections:**
|
||||
- 11 detailed API integration guides (HEDD, GMC, NMC, Companies House, etc.)
|
||||
- Contact information for each service
|
||||
- Integration methods (API vs. scraper alternatives)
|
||||
- Timeline for access approval
|
||||
- Vendor recommendations (DBS, HMRC)
|
||||
- Email template for API requests
|
||||
- Compliance checklist
|
||||
|
||||
**Read Time:** 20-30 minutes (reference document)
|
||||
|
||||
---
|
||||
|
||||
## Quick Navigation
|
||||
|
||||
### By Role
|
||||
|
||||
**Executive / Decision-Maker:**
|
||||
1. Start: EXECUTIVE_SUMMARY.md (5 min)
|
||||
2. Then: UK_MARKET_STRATEGY.md - Market & GTM sections (10 min)
|
||||
3. Decision: Approve Phase 1 go-ahead
|
||||
|
||||
**Product Manager:**
|
||||
1. Start: EXECUTIVE_SUMMARY.md (5 min)
|
||||
2. Then: UK_FEATURE_PRIORITIZATION.md (full read)
|
||||
3. Then: UK_MARKET_STRATEGY.md (full read)
|
||||
4. Then: Reference PHASE1_TECHNICAL_IMPLEMENTATION.md & API_RESOURCES_AND_CONTACTS.md as needed
|
||||
|
||||
**Engineering Lead:**
|
||||
1. Start: EXECUTIVE_SUMMARY.md (5 min for context)
|
||||
2. Then: PHASE1_TECHNICAL_IMPLEMENTATION.md (full read)
|
||||
3. Then: API_RESOURCES_AND_CONTACTS.md (full read)
|
||||
4. Reference: UK_FEATURE_PRIORITIZATION.md for feature specs
|
||||
|
||||
**Investor / Analyst:**
|
||||
1. Start: EXECUTIVE_SUMMARY.md
|
||||
2. Then: UK_MARKET_STRATEGY.md - Market size & financials sections
|
||||
3. Reference: UK_FEATURE_PRIORITIZATION.md for technical validation
|
||||
|
||||
**Sales / Marketing:**
|
||||
1. Start: EXECUTIVE_SUMMARY.md
|
||||
2. Then: UK_MARKET_STRATEGY.md (GTM + Personas)
|
||||
3. Reference: UK_FEATURE_PRIORITIZATION.md for talking points
|
||||
|
||||
---
|
||||
|
||||
## Key Metrics at a Glance
|
||||
|
||||
### Market Opportunity
|
||||
- **TAM (Total Addressable Market):** £3.3M
|
||||
- **SAM (Serviceable Available Market):** £200-300K (Year 1)
|
||||
- **Year 1 Revenue Target:** £30-240K (conservative to growth)
|
||||
- **Break-even Customers:** 24-30 paying customers
|
||||
- **Expected Timeline to Break-even:** Month 6-7
|
||||
|
||||
### Phase 1 Deliverables (8 weeks)
|
||||
| Feature | Impact | Effort | Timeline |
|
||||
|---|---|---|---|
|
||||
| HEDD Degree Verification | 9.5/10 | 2-3 weeks | Weeks 1-3 |
|
||||
| Healthcare Register Checks | 6.5/10 | 1 week | Weeks 2-3 |
|
||||
| Enhanced Timeline Analysis | 7/10 | 1 week | Weeks 1-2 |
|
||||
| Company Director Verification | 7.5/10 | 1-2 weeks | Weeks 2-4 |
|
||||
|
||||
### Success Metrics
|
||||
- **Adoption:** 500+ signups in first month
|
||||
- **Engagement:** 10%+ weekly active check rate
|
||||
- **Satisfaction:** 85%+ feature satisfaction (NPS >40)
|
||||
|
||||
---
|
||||
|
||||
## Fraud Detection Coverage
|
||||
|
||||
| Fraud Type | Detection Rate | Phase |
|
||||
|---|---|---|
|
||||
| Fake degrees | 90%+ | Phase 1 |
|
||||
| Employment date falsification | 80%+ | Phase 1 |
|
||||
| Job title inflation | Partial (manual) | Phase 1 |
|
||||
| Exaggerated qualifications | 85%+ | Phase 2 |
|
||||
| Professional registration fraud | 95%+ | Phase 2 |
|
||||
| Directorship false claims | 95%+ | Phase 1 |
|
||||
|
||||
---
|
||||
|
||||
## Competitive Moat
|
||||
|
||||
**Why no competitor offers this:**
|
||||
|
||||
1. **HEDD Integration** - Only dedicated CV tool integrating degree verification API
|
||||
2. **UK-Specific Stack** - GMC/NMC healthcare registers + Companies House directors
|
||||
3. **Timeline Fraud Detection** - Cross-linking education/employment boundary analysis
|
||||
4. **Vertical Focus** - Healthcare recruiting niche dominance (GMC/NMC)
|
||||
5. **First-Mover Advantage** - Market gap unexploited until now
|
||||
|
||||
**Defensibility:**
|
||||
- Deep integrations hard to replicate (HEDD, Companies House, professional bodies)
|
||||
- Network effects once established (more data = better fraud detection)
|
||||
- Compliance/audit trail = switching costs for enterprise customers
|
||||
|
||||
---
|
||||
|
||||
## Critical Path Dependencies
|
||||
|
||||
### Week 1 Actions (Do Now)
|
||||
- [ ] Email HEDD (partnerships@hedd.ac.uk) requesting API access
|
||||
- [ ] Email GMC requesting verification API access
|
||||
- [ ] Allocate 2 engineers to Phase 1 development
|
||||
- [ ] Recruit 3-5 beta partner agencies
|
||||
|
||||
### Week 2-3
|
||||
- [ ] HEDD credential delivery (or scraper fallback)
|
||||
- [ ] Companies House enhancement development starts
|
||||
- [ ] Healthcare register scraper development starts
|
||||
- [ ] Timeline analysis enhancement starts
|
||||
|
||||
### Week 4-8
|
||||
- [ ] Beta testing with agency partners
|
||||
- [ ] Public beta launch
|
||||
- [ ] Feedback iteration
|
||||
- [ ] GA release
|
||||
|
||||
---
|
||||
|
||||
## Financial Summary
|
||||
|
||||
### Year 1 Projections (Conservative Scenario)
|
||||
|
||||
**50 Customers by end of year:**
|
||||
- 30 × Professional tier (£49/mo): £1,470/mo
|
||||
- 15 × Enterprise tier (£199/mo): £2,985/mo
|
||||
- 5 × API/Platform (£1,000/mo): £5,000/mo
|
||||
- **Total MRR (Dec 2026):** £9,455
|
||||
- **Annualized Run Rate:** £113,460
|
||||
|
||||
**Operating Costs:**
|
||||
- Engineering (2 FTE): £150K/year
|
||||
- Infrastructure/APIs: £20K/year
|
||||
- Sales/Marketing: £30K/year
|
||||
- Operations: £20K/year
|
||||
- **Total:** £220K/year
|
||||
|
||||
**Result:** Break-even at 24 customers; profitable at 50+ customers
|
||||
|
||||
### Year 2 Projections (Growth Scenario)
|
||||
|
||||
**150 Customers:**
|
||||
- MRR: £28,000+
|
||||
- Annualized: £336K+
|
||||
- Gross Profit: 75% = £252K+
|
||||
|
||||
---
|
||||
|
||||
## Risk Mitigation
|
||||
|
||||
| Risk | Probability | Severity | Mitigation |
|
||||
|---|---|---|---|
|
||||
| HEDD API access delayed | Medium | Medium | Use web portal integration fallback |
|
||||
| GMC/NMC scraper blocked | Low | Low | Request official API proactively |
|
||||
| Market adoption slow | Medium | High | Focus on healthcare vertical first |
|
||||
| Regulatory gatekeeping | Low | Medium | Partner with established vendors early |
|
||||
| Competitive response | Medium | Medium | Maintain first-mover advantage + deepen integrations |
|
||||
|
||||
---
|
||||
|
||||
## Next Steps (30-Day Plan)
|
||||
|
||||
### Days 1-3: Preparation
|
||||
- [ ] Finalize HEDD compliance/consent workflows
|
||||
- [ ] Identify recruitment agency beta partners
|
||||
- [ ] Set up development environment
|
||||
- [ ] Brief engineering team on Phase 1 scope
|
||||
|
||||
### Days 4-7: API Access Requests
|
||||
- [ ] Email HEDD, GMC, NMC with API access requests
|
||||
- [ ] Register on beta platforms where available
|
||||
- [ ] Prepare scraper fallbacks for development
|
||||
|
||||
### Days 8-21: Development (Parallel Tracks)
|
||||
- **Track 1:** HEDD integration (lead engineer)
|
||||
- **Track 2:** Healthcare registers (secondary engineer)
|
||||
- **Track 3:** Companies House enhancement (tertiary)
|
||||
- **Track 4:** Timeline enhancement (parallel)
|
||||
|
||||
### Days 22-28: Beta Testing
|
||||
- [ ] Deploy to test environment
|
||||
- [ ] Onboard beta partner agencies
|
||||
- [ ] Collect feedback on UX/value
|
||||
- [ ] Iterate on flag messaging
|
||||
|
||||
### Days 29-30: Preparation for Public Launch
|
||||
- [ ] Final testing & QA approval
|
||||
- [ ] Marketing assets prepared
|
||||
- [ ] Pricing finalized
|
||||
- [ ] Customer support workflows documented
|
||||
|
||||
---
|
||||
|
||||
## Recommended Reading Order
|
||||
|
||||
**For executives/investors (20 minutes total):**
|
||||
1. EXECUTIVE_SUMMARY.md (5 min)
|
||||
2. UK_MARKET_STRATEGY.md → Market Opportunity + Financials sections (10 min)
|
||||
3. UK_FEATURE_PRIORITIZATION.md → Overview + Ranked Feature List (5 min)
|
||||
|
||||
**For product/engineering teams (90 minutes total):**
|
||||
1. EXECUTIVE_SUMMARY.md (5 min)
|
||||
2. UK_FEATURE_PRIORITIZATION.md (30 min - full read)
|
||||
3. PHASE1_TECHNICAL_IMPLEMENTATION.md (40 min - full read)
|
||||
4. API_RESOURCES_AND_CONTACTS.md (15 min - reference)
|
||||
|
||||
**For detailed implementation (3-4 hours for engineers):**
|
||||
1. PHASE1_TECHNICAL_IMPLEMENTATION.md (40 min - detailed read)
|
||||
2. API_RESOURCES_AND_CONTACTS.md (30 min - full read)
|
||||
3. Code examples in PHASE1_TECHNICAL_IMPLEMENTATION.md (60-90 min - study)
|
||||
4. UK_FEATURE_PRIORITIZATION.md → Implementation Examples (30 min)
|
||||
|
||||
---
|
||||
|
||||
## Questions & Decision Points
|
||||
|
||||
### For Product Leadership
|
||||
1. **Commitment:** Can we allocate 2 engineers full-time for 8 weeks?
|
||||
2. **Partnerships:** Will we sponsor API access requests to HEDD, GMC, NMC?
|
||||
3. **Revenue Model:** Approve tiered pricing (Free/Pro/Enterprise)?
|
||||
4. **Timeline:** Can we launch beta by Week 5?
|
||||
5. **International:** After UK success, should we expand to Ireland/Australia?
|
||||
|
||||
### For Engineering
|
||||
1. **Resources:** Do we have backend capacity starting immediately?
|
||||
2. **Technical:** Any concerns with HEDD/GMC/NMC integration approach?
|
||||
3. **Alternatives:** Any preference on API vs. scraper approach for health registers?
|
||||
4. **Testing:** Do we have QA capacity for Phase 1 scope?
|
||||
|
||||
### For Sales/Marketing
|
||||
1. **Positioning:** Are we confident "degree verification" is primary differentiator?
|
||||
2. **Channels:** Should we prioritize direct sales or partnerships?
|
||||
3. **Pricing:** Does the £49/month Professional tier feel right for the target market?
|
||||
4. **Beta:** Can we identify 3-5 recruitment agency beta partners by Week 2?
|
||||
|
||||
---
|
||||
|
||||
## Success Criteria (End of Phase 1)
|
||||
|
||||
### Must-Haves
|
||||
- ✅ HEDD integration live (real-time + manual review tracking)
|
||||
- ✅ Timeline fraud detection enhanced
|
||||
- ✅ Companies House director verification working
|
||||
- ✅ GMC/NMC healthcare checks live
|
||||
- ✅ 500+ public signups
|
||||
- ✅ 10%+ weekly active check rate
|
||||
|
||||
### Nice-to-Haves
|
||||
- ✅ 85%+ user satisfaction score
|
||||
- ✅ Media/analyst coverage
|
||||
- ✅ 5+ paying customers (revenue: £2-5K MRR)
|
||||
- ✅ Documented case studies
|
||||
|
||||
### Failure Indicators (Red Flags)
|
||||
- ❌ <100 signups after public launch
|
||||
- ❌ HEDD/GMC access denied with no scraper backup
|
||||
- ❌ >5% API error rate
|
||||
- ❌ <50% feature adoption
|
||||
|
||||
---
|
||||
|
||||
## File Manifest
|
||||
|
||||
```
|
||||
/mnt/d/Git/TrueCV/
|
||||
├── EXECUTIVE_SUMMARY.md (5-page exec overview)
|
||||
├── UK_FEATURE_PRIORITIZATION.md (30-page detailed prioritization)
|
||||
├── PHASE1_TECHNICAL_IMPLEMENTATION.md (60-page technical specs + code)
|
||||
├── UK_MARKET_STRATEGY.md (40-page market + GTM strategy)
|
||||
├── API_RESOURCES_AND_CONTACTS.md (20-page API integration guide)
|
||||
└── README_UK_STRATEGY.md (this file - navigation guide)
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
## Version History
|
||||
|
||||
**v1.0 - January 2026**
|
||||
- Initial UK market strategy & implementation plan
|
||||
- 4 comprehensive strategy documents
|
||||
- Phase 1 technical specifications
|
||||
- API integration guide
|
||||
- Ready for Q1 2026 execution
|
||||
|
||||
---
|
||||
|
||||
## Contact & Support
|
||||
|
||||
**For questions about this strategy:**
|
||||
- Product Lead: [Name] - Overall strategy & market analysis
|
||||
- Engineering Lead: [Name] - Technical feasibility & architecture
|
||||
- API Integration: [Name] - HEDD, GMC, NMC coordination
|
||||
|
||||
**For strategy updates:**
|
||||
These documents will be updated quarterly with:
|
||||
- Market feedback from beta partners
|
||||
- API integration progress
|
||||
- Competitive landscape changes
|
||||
- Revised financial projections
|
||||
- Phase 2 feature updates
|
||||
|
||||
---
|
||||
|
||||
## Appendix: Key Definitions
|
||||
|
||||
**HEDD:** Higher Education Degree Datacheck - UK's official degree verification service (140+ universities)
|
||||
|
||||
**GMC:** General Medical Council - UK regulator for doctors (~250K registered)
|
||||
|
||||
**NMC:** Nursing and Midwifery Council - UK regulator for nurses/midwives (~700K registered)
|
||||
|
||||
**Companies House:** UK company registration authority - maintains register of 3.4M companies + directors
|
||||
|
||||
**Timeline Fraud:** Employment/education date inconsistencies (overlaps, gaps, sequencing issues)
|
||||
|
||||
**TAM:** Total Addressable Market - theoretical maximum revenue if 100% market capture
|
||||
|
||||
**SAM:** Serviceable Available Market - realistic segment we can target
|
||||
|
||||
**SOM:** Serviceable Obtainable Market - Year 1 revenue target
|
||||
|
||||
**CAC:** Customer Acquisition Cost - avg. cost to acquire one paying customer
|
||||
|
||||
**ARPU:** Average Revenue Per User - avg. monthly/annual revenue per customer
|
||||
|
||||
**LTV:CAC:** Customer lifetime value to acquisition cost ratio (healthy SaaS: >3:1)
|
||||
|
||||
---
|
||||
|
||||
## License & Confidentiality
|
||||
|
||||
This strategy document is internal to TrueCV and contains commercially sensitive information including:
|
||||
- Market sizing & financial projections
|
||||
- Competitive positioning
|
||||
- Product roadmap
|
||||
- API integration details
|
||||
|
||||
**Distribution:** Product team, engineering, leadership only
|
||||
|
||||
---
|
||||
|
||||
END OF DOCUMENT
|
||||
|
||||
**Last Updated:** January 20, 2026
|
||||
**Next Review:** April 1, 2026 (Post-Phase 1 Launch)
|
||||
@@ -1,631 +0,0 @@
|
||||
# TrueCV UK Market Feature Prioritization
|
||||
|
||||
**Date:** January 2026
|
||||
**Focus:** UK-Only Market Opportunities
|
||||
**Baseline:** Companies House integration, Claude AI parsing, Timeline analysis
|
||||
|
||||
---
|
||||
|
||||
## Executive Summary
|
||||
|
||||
UK CV fraud is escalating with AI-generated deepfakes, synthetic identities, and traditional qualification falsification. The most impactful opportunity for TrueCV in the UK market is **degree verification integration** (HEDD API), followed by **employment verification automation** and **professional body registration checks**. These three features represent 78% of recruiter pain points and address 85% of detected fraud patterns.
|
||||
|
||||
---
|
||||
|
||||
## Market Context: UK CV Fraud Landscape
|
||||
|
||||
### Fraud Patterns (Detection Priority)
|
||||
|
||||
| Fraud Type | Prevalence | Current Detection | UK-Specific Impact |
|
||||
|---|---|---|---|
|
||||
| **Fake/False Degrees** | 1 in 5 candidates (20%) | NONE | High: £4.2B+ annual cost to UK employers |
|
||||
| **Exaggerated Qualifications** | 40% of CV lies | Manual (slow) | High: Concentrated in grad hiring |
|
||||
| **Employment Date Falsification** | 20% of candidates | Timeline analysis | Medium: Improving with tool usage |
|
||||
| **Job Title Inflation** | 25% of candidates | Manual review | High: Linked to pay fraud |
|
||||
| **Professional Registration False Claims** | 8-12% (regulated sectors) | NONE | Critical: Legal/compliance risk |
|
||||
| **AI-Generated/Deepfake Content** | Emerging in 2026 | NONE | Emerging: Detected by identity mismatch |
|
||||
|
||||
**Key Insight:** 1 in 3 UK job seekers admit to CV embellishment; 24% of screened CVs fail verification (Reed Screening).
|
||||
|
||||
---
|
||||
|
||||
## Available UK Data Sources & APIs
|
||||
|
||||
### 1. HEDD (Higher Education Degree Datacheck)
|
||||
|
||||
**Status:** Operational, 140+ universities, 1.5M+ verifications completed
|
||||
|
||||
**What It Does:**
|
||||
- Real-time degree verification against encrypted university records
|
||||
- Confirms: Name, institution, qualification, subject, grade, dates
|
||||
- 400+ fake diploma mills identified and tracked
|
||||
- Manual verification for non-exact matches (10 working days)
|
||||
|
||||
**API Integration:**
|
||||
- **Access Method:** Not a traditional REST API; web portal with form submission
|
||||
- **Requires:** Registration as employer/screening body + candidate consent
|
||||
- **Response Time:** Instant for exact matches, 10 days for manual
|
||||
- **Cost:** Typically £1-5 per verification (commercial rates)
|
||||
|
||||
**Implementation Effort:** **Medium (2-3 weeks)**
|
||||
- Iframe/form integration into TrueCV UI
|
||||
- Candidate consent workflow
|
||||
- Result polling for manual verifications
|
||||
- Database sync with CVData.Education entries
|
||||
|
||||
**Impact Score:** **9.5/10**
|
||||
- Eliminates 90%+ of fake degree claims
|
||||
- 1 in 5 UK hires have false degree (Cifas data)
|
||||
- Recruiters rank this #1 missing feature
|
||||
- Regulatory confidence (compliance visible)
|
||||
|
||||
---
|
||||
|
||||
### 2. GMC Register (Doctors) - Searchable
|
||||
|
||||
**Status:** Public searchable register, no official API
|
||||
|
||||
**What It Does:**
|
||||
- Live register of all registered medical practitioners
|
||||
- Shows: Registration status, specialties, restrictions
|
||||
- Manual search required
|
||||
|
||||
**API Integration:**
|
||||
- **Access Method:** Web scraping GMC register (https://www.gmc-uk.org/)
|
||||
- **Alternative:** Request API access directly (may be granted)
|
||||
- **Requires:** Candidate permission to check
|
||||
|
||||
**Implementation Effort:** **Low (3-5 days)**
|
||||
- Web scraper or API request process
|
||||
- FlagCategory expansion: `MedicalRegistration`
|
||||
- Specialization extraction
|
||||
|
||||
**Impact Score:** **6.5/10**
|
||||
- Targets 1.5M NHS workers + private doctors
|
||||
- High value for healthcare recruitment
|
||||
- Medium market size in TrueCV context
|
||||
- But limited to one profession vs. broad application
|
||||
|
||||
---
|
||||
|
||||
### 3. NMC Register (Nurses/Midwives) - Searchable
|
||||
|
||||
**Status:** Public searchable register, no official API
|
||||
|
||||
**What It Does:**
|
||||
- Register of all UK nurses, midwives, nursing associates
|
||||
- Shows: Registration status, Pin number, areas of practice
|
||||
- Real-time updates
|
||||
|
||||
**API Integration:**
|
||||
- **Access Method:** Web scraping NMC register
|
||||
- **Alternative:** Similar API request potential as GMC
|
||||
- **Requires:** Candidate permission
|
||||
|
||||
**Implementation Effort:** **Low (3-5 days)**
|
||||
- Reusable scraper pattern from GMC
|
||||
- FlagCategory expansion: `HealthcareRegistration`
|
||||
|
||||
**Impact Score:** **7/10**
|
||||
- Targets 700K+ UK nurses
|
||||
- Growing market (NHS recruitment surge)
|
||||
- Similar process to GMC
|
||||
- High fraud risk in agency nursing
|
||||
|
||||
---
|
||||
|
||||
### 4. Companies House API (Already Integrated)
|
||||
|
||||
**Status:** ✓ Already implemented in TrueCV
|
||||
|
||||
**Current Coverage:**
|
||||
- Fuzzy matching on company names (70%+ threshold)
|
||||
- Company registration status validation
|
||||
- 30-day cache layer
|
||||
|
||||
**Enhancement Opportunity:**
|
||||
- **Companies House Officer Search API:** Verify claimed director roles
|
||||
- **Officer Appointments API:** Cross-check employment dates against directorship periods
|
||||
- **Dissolution Dates:** Flag roles claimed after company closure
|
||||
|
||||
**Implementation Effort:** **Low (1-2 weeks)**
|
||||
- Extend existing CompaniesHouseClient
|
||||
- Add new service layer: CompanyDirectorVerifier
|
||||
- Create new FlagCategory: `DirectorshipVerification`
|
||||
|
||||
**Impact Score:** **7.5/10**
|
||||
- Validates self-employed/director claims (high fraud area)
|
||||
- Existing infrastructure (quick win)
|
||||
- Medium-high detection value
|
||||
- Applicable to 15-20% of CVs with self-employment
|
||||
|
||||
---
|
||||
|
||||
### 5. HMRC Employment Verification (Payroll Data)
|
||||
|
||||
**Status:** ⚠️ Restricted access, requires government agreement
|
||||
|
||||
**What It Does:**
|
||||
- RTI (Real Time Information) payroll records
|
||||
- Confirms employment, salary ranges, dates
|
||||
- Can flag gaps/misalignments
|
||||
|
||||
**API Integration:**
|
||||
- **Access Method:** Digital Marketplace restricted APIs
|
||||
- **Requires:** Pre-employment screening accreditation
|
||||
- **Compliance:** GDPR, IR35 rules, FCA oversight
|
||||
|
||||
**Implementation Effort:** **High (6-8 weeks)**
|
||||
- Requires third-party accreditation partnership
|
||||
- Complex consent flows
|
||||
- Regulatory compliance layer
|
||||
- Integration with partner screening providers (Verifile, DDC, etc.)
|
||||
|
||||
**Impact Score:** **9/10** (if accessible)
|
||||
- Authoritative employment verification
|
||||
- Detects date falsification with 95%+ accuracy
|
||||
- High compliance value (IR35, tax verification)
|
||||
- BUT: Access requires government partnership
|
||||
|
||||
---
|
||||
|
||||
### 6. Professional Body Registers
|
||||
|
||||
#### Regulated Professions (UK Regulatory Bodies)
|
||||
|
||||
| Profession | Regulator | Register | API Status | Verification Value |
|
||||
|---|---|---|---|---|
|
||||
| Accountants (ICAEW) | ICAEW | Member search | ❌ No API | High (~180K members) |
|
||||
| Lawyers (SRA) | SRA | Public register | ❌ No API | High (~170K solicitors) |
|
||||
| Engineers (IET/ICE) | Various | Member search | ❌ No API | Medium (~150K) |
|
||||
| Architects | RIBA | Public register | ❌ No API | Medium (~50K) |
|
||||
| Psychologists | HCPC | Public register | ❌ No API | Low (~50K) |
|
||||
|
||||
**Access Pattern:** All require manual web scraping or direct API requests to individual bodies
|
||||
|
||||
**Implementation Effort:** **Medium-High (4-6 weeks per profession)**
|
||||
- Build scraper templates per register format
|
||||
- Create generic ProfessionalRegistration flag type
|
||||
- Maintain updatable registry of professions/URLs
|
||||
|
||||
**Impact Score:** **6-7/10** (varies by profession)
|
||||
- ICAEW/SRA highest value (financial/legal fraud common)
|
||||
- Medium-term value; low adoption initially
|
||||
- Regulatory compliance appeal
|
||||
- Requires consent management per profession
|
||||
|
||||
---
|
||||
|
||||
### 7. Regulated Professions Register (GOV.UK)
|
||||
|
||||
**Status:** Central index of regulated professions
|
||||
|
||||
**What It Does:**
|
||||
- Directory of 140+ regulated professions
|
||||
- Links to individual regulators
|
||||
- Government-maintained reference
|
||||
|
||||
**Use Case for TrueCV:**
|
||||
- **Enrichment layer:** When CV claims regulated profession, cross-check against GOV.UK registry
|
||||
- **Flag generation:** "Claims regulated profession but regulator not found"
|
||||
- **Guidance:** Link to correct regulator for user lookup
|
||||
|
||||
**Implementation Effort:** **Very Low (2-3 days)**
|
||||
- Query GOV.UK API or static dataset
|
||||
- Regex match against CV claims
|
||||
- Decision tree for flagging
|
||||
|
||||
**Impact Score:** **5/10**
|
||||
- Low direct detection value
|
||||
- High utility for user education
|
||||
- Low implementation cost
|
||||
- Good for Trust/Transparency (UX win)
|
||||
|
||||
---
|
||||
|
||||
### 8. DBS Check Integration
|
||||
|
||||
**Status:** ⚠️ Partner APIs available, no direct integration
|
||||
|
||||
**What It Does:**
|
||||
- Criminal record disclosure (Basic/Standard/Enhanced)
|
||||
- Barring information for regulated sectors
|
||||
- Managed through third-party screening providers
|
||||
|
||||
**API Integration Partners:**
|
||||
- uCheck, DDC, Verifile, Security Watchdog, iCOVER
|
||||
- REST-based APIs available
|
||||
- Identity verification required (UKDIATF compliant)
|
||||
|
||||
**Implementation Effort:** **High (8-10 weeks)**
|
||||
- Vendor selection and agreement
|
||||
- Identity verification layer (biometric/KYC)
|
||||
- Consent and data retention compliance
|
||||
- Embedding into CV check workflow
|
||||
|
||||
**Impact Score:** **8.5/10** (High business value, regulatory)
|
||||
- Addresses emerging security concern
|
||||
- High compliance requirement for regulated roles
|
||||
- Revenue opportunity (typically £20-50/check)
|
||||
- BUT: Complex compliance; may cannibalize revenue if offered in the free tier
|
||||
|
||||
---
|
||||
|
||||
## Ranked Feature Prioritization
|
||||
|
||||
### Priority Matrix: Detection Value × Implementation Feasibility
|
||||
|
||||
```
|
||||
HIGH VALUE + EASY │ HIGH VALUE + HARD
|
||||
─────────────────────┼─────────────────
|
||||
1. HEDD (Degrees) │ 8. DBS Integration
|
||||
2. Timeline Enhance │ 5. HMRC Payroll
|
||||
3. GMC/NMC Scraper │ 6. Professional Bodies
|
||||
4. Directors House │
|
||||
─────────────────────┼─────────────────
|
||||
MEDIUM VALUE + EASY │ MEDIUM VALUE + HARD
|
||||
─────────────────────┼─────────────────
|
||||
7. GOV.UK Registry │
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
## Recommended Implementation Roadmap
|
||||
|
||||
### Phase 1: Q1 2026 (Weeks 1-8) - High-Impact Foundation
|
||||
|
||||
**1. HEDD Degree Verification** ⭐ PRIMARY FOCUS
|
||||
- **Deliverable:** Full HEDD integration with candidate consent flow
|
||||
- **Effort:** 2-3 weeks dev + 1 week testing
|
||||
- **Expected Impact:**
|
||||
- Covers ~40% of CV fraud patterns
|
||||
- Solves recruiters' #1 complaint
|
||||
- Immediate competitive advantage
|
||||
- **Pricing:** Pass-through cost model (£1-2 per verification, charged to the user)
|
||||
- **Implementation:**
|
||||
```
|
||||
src/TrueCV.Infrastructure/ExternalApis/HeddClient.cs
|
||||
src/TrueCV.Application/Interfaces/IEducationVerifierService.cs
|
||||
src/TrueCV.Infrastructure/Services/EducationVerifierService.cs
|
||||
FlagCategory += EducationVerification
|
||||
Add new flag types:
|
||||
- DegreeNotFound
|
||||
- DegreeClassificationMismatch
|
||||
- GraduationDateMismatch
|
||||
- InstitutionNotFound
|
||||
```
|
||||
|
||||
**2. Enhanced Timeline Analysis** ⭐ QUICK WIN
|
||||
- **Enhancement:** Extend existing TimelineAnalyserService
|
||||
- **Effort:** 1 week dev
|
||||
- **Expected Impact:**
|
||||
- Detect suspicious employment date overlaps (>20% of fraud)
|
||||
- Flag gaps exceeding 12 months (note: longer gaps are becoming more accepted in the UK)
|
||||
- Identify anomalies where employment starts before the degree end date
|
||||
- **Implementation:**
|
||||
```
|
||||
src/TrueCV.Infrastructure/Services/TimelineAnalyserService.cs
|
||||
- Add: UKEmploymentPatternAnalyzer
|
||||
- Add: EducationEmploymentSequenceValidator
|
||||
- New flags:
|
||||
- EmploymentStartBeforeEducationCompletion
|
||||
- UnusualEmploymentGapPattern
|
||||
- MultipleParallelEmployments (>20% tolerated)
|
||||
```
|
||||
|
||||
**3. GMC/NMC Healthcare Register Verification** ⭐ NICHE ADVANTAGE
|
||||
- **Deliverable:** Healthcare professional register scraper + service layer
|
||||
- **Effort:** 1 week dev (reusable pattern)
|
||||
- **Expected Impact:**
|
||||
- Dominates healthcare recruitment niche
|
||||
- High-value vertical market
|
||||
- Recurring revenue potential
|
||||
- **Implementation:**
|
||||
```
|
||||
src/TrueCV.Infrastructure/ExternalApis/HealthcareRegisterClient.cs
|
||||
src/TrueCV.Application/Interfaces/IHealthcareVerifierService.cs
|
||||
FlagCategory += HealthcareRegistration
|
||||
New flags:
|
||||
- GMCNotFound / GMCRestricted / GMCLapsed
|
||||
- NMCNotFound / NMCRestricted
|
||||
```
|
||||
|
||||
**4. Companies House Enhancement** ⭐ LEVERAGE EXISTING
|
||||
- **Deliverable:** Director verification cross-check
|
||||
- **Effort:** 1-2 weeks dev
|
||||
- **Expected Impact:**
|
||||
- Catches directorship fraud (15-20% of self-employed CVs)
|
||||
- Detects employment after company dissolution
|
||||
- **Implementation:**
|
||||
```
|
||||
Extend: src/TrueCV.Infrastructure/ExternalApis/CompaniesHouseClient.cs
|
||||
Add: OfficerAppointmentsClient.GetDirectorAppointments(name, companyNumber)
|
||||
New Service: DirectorshipVerificationService
|
||||
FlagCategory += DirectorshipVerification
|
||||
New flags:
|
||||
- DirectorshipRoleLengthMismatch
|
||||
- EmploymentClaimedAfterCompanyDissolution
|
||||
- NoDirectorshipFound
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
### Phase 2: Q2 2026 (Weeks 9-16) - Regulatory & Professional Bodies
|
||||
|
||||
**5. Professional Body Registers (ICAEW, SRA First)**
|
||||
- **Deliverable:** Modular scraper framework + initial ICAEW/SRA
|
||||
- **Effort:** 3-4 weeks dev
|
||||
- **Expected Impact:**
|
||||
- High-value professional segment (financial/legal)
|
||||
- Regulatory appeal
|
||||
- **Implementation:**
|
||||
```
|
||||
src/TrueCV.Infrastructure/ExternalApis/ProfessionalBodyClient.cs
|
||||
src/TrueCV.Infrastructure/ExternalApis/Scrapers/
|
||||
- ICAEWMembershipVerifier.cs
|
||||
- SRALawyerVerifier.cs
|
||||
- IETEngineerVerifier.cs
|
||||
FlagCategory += ProfessionalRegistration
|
||||
```
|
||||
|
||||
**6. GOV.UK Regulated Professions Registry**
|
||||
- **Deliverable:** Enrichment layer for professional claims
|
||||
- **Effort:** 2-3 days dev
|
||||
- **Expected Impact:**
|
||||
- Trust/transparency feature
|
||||
- User education value
|
||||
- Low dev cost, medium UX value
|
||||
|
||||
---
|
||||
|
||||
### Phase 3: Q3 2026+ (Strategic Partnerships)
|
||||
|
||||
**7. HMRC RTI Payroll Integration**
|
||||
- **Status:** Requires government partnership/accreditation
|
||||
- **Effort:** 8-10 weeks (vendor dependent)
|
||||
- **Expected Impact:** "Gold standard" employment verification
|
||||
- **Business Model:** Premium feature tier
|
||||
|
||||
**8. DBS Check Partnership**
|
||||
- **Status:** Requires vendor agreement + compliance framework
|
||||
- **Effort:** 8-10 weeks
|
||||
- **Expected Impact:** Security compliance selling point
|
||||
- **Business Model:** Premium tier or per-check revenue
|
||||
|
||||
---
|
||||
|
||||
## Implementation Examples
|
||||
|
||||
### 1. HEDD Integration Example
|
||||
|
||||
```csharp
|
||||
// New service interface
|
||||
/// <summary>
/// Contract for a service that verifies a candidate's claimed degree.
/// </summary>
public interface IEducationVerifierService
{
    /// <summary>
    /// Verifies a single claimed qualification for a candidate.
    /// </summary>
    /// <param name="candidateName">Candidate's name.</param>
    /// <param name="dateOfBirth">Candidate's date of birth.</param>
    /// <param name="institution">Name of the institution the degree is claimed from.</param>
    /// <param name="graduationYear">
    /// Claimed graduation date, if known.
    /// NOTE(review): the name suggests a year but the type is a full date - confirm which is intended.
    /// </param>
    /// <param name="qualification">Claimed qualification, if known.</param>
    /// <param name="subject">Claimed subject, if known.</param>
    /// <param name="grade">Claimed grade, if known.</param>
    /// <returns>A task producing the verification result.</returns>
    Task<EducationVerificationResult> VerifyDegreeAsync(
        string candidateName,
        DateOnly dateOfBirth,
        string institution,
        DateOnly? graduationYear,
        string? qualification,
        string? subject,
        string? grade);
}
|
||||
|
||||
// New flag categories
|
||||
/// <summary>
/// Category assigned to a verification flag.
/// The members marked NEW are appended after the others, so the implicit
/// numeric values of the earlier members do not shift.
/// </summary>
public enum FlagCategory
{
    Employment,
    Education,                // Existing
    Timeline,
    Plausibility,
    EducationVerification,    // NEW
    DirectorshipVerification, // NEW
    HealthcareRegistration,   // NEW
    ProfessionalRegistration  // NEW
}
|
||||
|
||||
// Example: Enhanced timeline analysis
|
||||
/// <summary>
/// Example timeline check that flags unusually long gaps between two dates.
/// </summary>
public class TimelineAnalyserService
{
    /// <summary>Gap length, in months, beyond which a gap is flagged.</summary>
    private const int RedFlagGapMonths = 12;

    /// <summary>
    /// Decides whether the gap between two dates is long enough to flag.
    /// </summary>
    /// <param name="startDate">Date on which the gap begins.</param>
    /// <param name="endDate">Date on which the gap ends.</param>
    /// <returns>
    /// A medium-severity <see cref="TimelineGap"/> when <paramref name="endDate"/> is more than
    /// <see cref="RedFlagGapMonths"/> months after <paramref name="startDate"/>;
    /// otherwise <c>null</c> (including when the dates are equal or reversed).
    /// </returns>
    public TimelineGap? CheckGapPlausibility(DateOnly startDate, DateOnly endDate)
    {
        // DateOnly has no subtraction operator, so compare against a shifted
        // date instead of computing a day count. Calendar months also avoid
        // leap-year drift in a fixed 366-day threshold.
        if (endDate <= startDate.AddMonths(RedFlagGapMonths))
        {
            return null;
        }

        return new TimelineGap
        {
            Severity = FlagSeverity.Medium,
            Title = "Unusually Long Employment Gap",
            Description = "Gap exceeds UK employment pattern norms"
        };
    }
}
|
||||
```
|
||||
|
||||
### 2. Healthcare Register Scraper Example
|
||||
|
||||
```csharp
|
||||
/// <summary>
/// Example verifier that looks a doctor up on the GMC register.
/// </summary>
public class GMCRegisterVerifier
{
    // Not referenced in the code shown here; presumably used by the scraping helper - confirm.
    private const string GMCRegisterUrl = "https://www.gmc-uk.org/";

    /// <summary>Confidence score reported when a register entry is found.</summary>
    private const int FoundConfidence = 95;

    /// <summary>
    /// Looks the doctor up and maps the register entry, if any, to a result.
    /// </summary>
    /// <param name="fullName">Doctor's full name.</param>
    /// <param name="gmcNumber">GMC number; optional.</param>
    /// <returns>
    /// A result whose <c>IsFound</c> is true and whose confidence is 95 when an entry was
    /// returned; otherwise <c>IsFound</c> is false, confidence is 0 and the other fields are null.
    /// </returns>
    public async Task<GMCVerificationResult> VerifyDoctorAsync(
        string fullName,
        string? gmcNumber = null)
    {
        // Web scrape or API query GMC register.
        // NOTE(review): ScrapeGMCRegisterAsync is not defined in this example.
        var result = await ScrapeGMCRegisterAsync(fullName, gmcNumber);

        return new GMCVerificationResult
        {
            IsFound = result is not null,
            RegistrationStatus = result?.Status,
            Specialties = result?.Specialties,
            Restrictions = result?.Restrictions,
            VerificationConfidence = result is not null ? FoundConfidence : 0
        };
    }
}
|
||||
|
||||
/// <summary>
/// Placeholder verifier for the NMC register; the lookup is not implemented yet.
/// </summary>
public class NMCRegisterVerifier
{
    /// <summary>
    /// Intended to verify a nurse, following a similar pattern to the GMC verifier.
    /// </summary>
    /// <param name="fullName">Nurse's full name.</param>
    /// <param name="pinNumber">PIN number; optional.</param>
    /// <returns>
    /// Currently always a faulted task carrying <see cref="NotImplementedException"/>.
    /// </returns>
    public Task<NMCVerificationResult> VerifyNurseAsync(
        string fullName,
        string? pinNumber = null)
    {
        // Similar pattern to GMC.
        // An empty async body does not compile (no value is returned), so the
        // missing implementation is surfaced as a faulted task instead.
        return Task.FromException<NMCVerificationResult>(
            new NotImplementedException("NMC register verification is not implemented yet."));
    }
}
|
||||
```
|
||||
|
||||
### 3. Companies House Director Verification Example
|
||||
|
||||
```csharp
|
||||
/// <summary>
/// Example service that checks a claimed directorship against a company's officer appointments.
/// </summary>
/// <remarks>
/// NOTE(review): <c>_companyVerifier</c>, <c>_companiesHouseClient</c> and the helpers
/// <c>CreateUnverifiedResult</c>, <c>CreateFlagResult</c>, <c>CreateVerifiedResult</c> and
/// <c>FuzzyMatch</c> are used below but not declared in this example.
/// </remarks>
public class DirectorshipVerificationService
{
    /// <summary>
    /// Verifies that the candidate appears as an officer of the named company and that the
    /// claimed start date is not earlier than the recorded appointment date.
    /// </summary>
    /// <param name="candidateName">Candidate's name, fuzzy-matched against officer names.</param>
    /// <param name="companyName">Company name to look up.</param>
    /// <param name="claimedStartDate">Start date claimed by the candidate.</param>
    /// <param name="claimedEndDate">
    /// End date claimed by the candidate.
    /// NOTE(review): accepted but not checked by the code shown here.
    /// </param>
    /// <returns>
    /// An unverified result when the company is not verified; a flag result when no matching
    /// appointment exists or the appointment date is after the claimed start date; otherwise a
    /// verified result built from the matching appointment.
    /// </returns>
    public async Task<DirectorshipVerificationResult> VerifyDirectorshipAsync(
        string candidateName,
        string companyName,
        DateOnly claimedStartDate,
        DateOnly claimedEndDate)
    {
        // Get company number from existing Companies House integration
        var company = await _companyVerifier.VerifyCompanyAsync(companyName);

        if (!company.IsVerified)
        {
            return CreateUnverifiedResult("Company not found");
        }

        // Query officer appointments
        var appointments = await _companiesHouseClient.GetOfficerAppointmentsAsync(
            company.MatchedCompanyNumber);

        // First appointment whose officer name fuzzy-matches the candidate.
        var matchingAppointment = appointments
            .FirstOrDefault(a => FuzzyMatch(a.OfficerName, candidateName));

        if (matchingAppointment is null)
        {
            return CreateFlagResult(
                "DirectorshipNotFound",
                $"No officer appointment found for {candidateName}");
        }

        // Verify dates align: the claim must not start before the recorded appointment.
        if (matchingAppointment.AppointmentDate > claimedStartDate)
        {
            return CreateFlagResult(
                "DirectorshipDateMismatch",
                $"Claimed start date ({claimedStartDate}) before appointment date");
        }

        return CreateVerifiedResult(matchingAppointment);
    }
}
|
||||
```
|
||||
|
||||
---
|
||||
|
||||
## Success Metrics for Phase 1
|
||||
|
||||
| Metric | Target | Owner |
|
||||
|---|---|---|
|
||||
| HEDD Integration Live | Week 3 | Engineering |
|
||||
| Education Flags Accuracy | >95% precision | QA |
|
||||
| Timeline Gaps Detected | >80% of actual gaps | Analytics |
|
||||
| GMC/NMC Scraper Complete | Week 4 | Engineering |
|
||||
| Healthcare Niche Adoption | 5+ healthcare recruiter orgs | Sales |
|
||||
| Detection Rate Improvement | +35% over baseline | Product |
|
||||
| User Satisfaction (HEDD) | >85% (low friction) | Support |
|
||||
|
||||
---
|
||||
|
||||
## Risk Mitigation
|
||||
|
||||
### HEDD Integration Risks
|
||||
- **Risk:** API changes or rate limiting
|
||||
- **Mitigation:** Use web portal integration first, request official API later; cache results aggressively
|
||||
- **Risk:** Candidate consent complexity
|
||||
- **Mitigation:** Clear one-click consent flow; educational messaging
|
||||
|
||||
### Professional Register Scraping Risks
|
||||
- **Risk:** Website structure changes break scrapers
|
||||
- **Mitigation:** Robust error handling; monitoring alerts; manual fallback links provided to users
|
||||
- **Risk:** Regulators restrict scraping
|
||||
- **Mitigation:** Request official API access proactively; provide value-add (fraud detection = mutual benefit)
|
||||
|
||||
### HMRC/DBS Integration Risks
|
||||
- **Risk:** Regulatory gatekeeping / approval delays
|
||||
- **Mitigation:** Start vendor conversations NOW; build partnerships in parallel
|
||||
- **Risk:** Compliance burden
|
||||
- **Mitigation:** Partner with established pre-employment screening vendors (Verifile, DDC) who handle compliance
|
||||
|
||||
---
|
||||
|
||||
## Competitive Advantage Summary
|
||||
|
||||
| Feature | TrueCV Advantage | Timeline |
|
||||
|---|---|---|
|
||||
| **HEDD Integration** | Only dedicated CV tool with instant degree verification | Q1 2026 |
|
||||
| **Healthcare Register Targeting** | Only tool targeting healthcare recruitment niche | Q1 2026 |
|
||||
| **Timeline + Education Linking** | Flags CVs where employment is shown as starting before the degree was completed = RED FLAG | Q1 2026 |
|
||||
| **Professional Body Framework** | Modular; expandable to 140+ professions vs competitors' static lists | Q2 2026 |
|
||||
| **Companies House Directors** | Only tool verifying self-employment claims against official records | Q1 2026 |
|
||||
|
||||
---
|
||||
|
||||
## UK Market Positioning
|
||||
|
||||
**Tagline:** *"The only CV verification tool UK recruiters need - from degree to directorship"*
|
||||
|
||||
**Market Segment:** Recruitment agencies, HR departments, background screening companies
|
||||
|
||||
**Price Model (Suggested):**
|
||||
- **Free Tier:** Companies House + Timeline Analysis
|
||||
- **Professional Tier:** +HEDD verification, +Healthcare registers (£29-49/user/month)
|
||||
- **Enterprise Tier:** +HMRC payroll, +DBS integration, +Professional bodies (Custom pricing)
|
||||
|
||||
---
|
||||
|
||||
## API Accessibility Summary
|
||||
|
||||
| Source | Type | Access Level | Cost | Feasibility |
|
||||
|---|---|---|---|---|
|
||||
| HEDD | Web Portal + Manual | Registered user | £1-5/check | Easy → Direct |
|
||||
| GMC Register | Public Web | Scrape/No API | Free | Easy → Scraper |
|
||||
| NMC Register | Public Web | Scrape/No API | Free | Easy → Scraper |
|
||||
| Companies House | REST API ✓ | Commercial | Free-£100/mo | Already done |
|
||||
| Directors API | REST API | Commercial | Included | Easy → Extend |
|
||||
| GOV.UK Professions | REST API | Open | Free | Easy → Query |
|
||||
| ICAEW Register | Public Web | Scrape/No API | Free | Medium → Scraper |
|
||||
| SRA Register | Public Web | Scrape/No API | Free | Medium → Scraper |
|
||||
| HMRC RTI | REST API | Restricted | Via partner | Hard → Partnership |
|
||||
| DBS | REST API | Via partner | £20-50/check | Hard → Partnership |
|
||||
|
||||
---
|
||||
|
||||
## Next Steps (This Week)
|
||||
|
||||
1. **Confirm HEDD feasibility** with legal/compliance (consent requirements, data handling)
|
||||
2. **Request GMC/NMC API access** officially (they may grant access, avoiding the need for scraping)
|
||||
3. **Map ICAEW/SRA register structures** for scraper design
|
||||
4. **Contact HMRC/DBS vendors** (Verifile, DDC) for partnership exploration
|
||||
5. **UK recruiter interviews:** Validate prioritization with 10-15 target customers
|
||||
6. **Wireframe HEDD UI** in parallel with backend work
|
||||
|
||||
---
|
||||
|
||||
## References
|
||||
|
||||
- [HEDD (Higher Education Degree Datacheck)](https://hedd.ac.uk/)
|
||||
- [GMC Register](https://www.gmc-uk.org/registration-and-licensing/our-registers)
|
||||
- [NMC Register](https://www.nmc.org.uk/registration/search-the-register/)
|
||||
- [UK Regulated Professions Register](https://www.regulated-professions.service.gov.uk/)
|
||||
- [CV Fraud UK Statistics - Cifas](https://www.cifas.org.uk/)
|
||||
- [UK Employment Gaps Report 2025 - LiveCareer](https://www.livecareer.co.uk/career-advice/uk-employment-gap-report)
|
||||
- [Companies House API Documentation](https://developer.companieshouse.gov.uk/)
|
||||
@@ -1,416 +0,0 @@
|
||||
# TrueCV UK Market Strategy & Product Roadmap
|
||||
|
||||
**Document Date:** January 2026
|
||||
**Focus:** UK CV verification market positioning
|
||||
**Horizon:** 12-month growth plan
|
||||
|
||||
---
|
||||
|
||||
## Market Opportunity
|
||||
|
||||
### Problem Statement
|
||||
|
||||
**UK CV fraud costs employers £4.2B+ annually** and is accelerating:
|
||||
|
||||
- **1 in 5 candidates** claim false university degrees (Cifas, 2025)
|
||||
- **40% of CV embellishments** relate to qualifications
|
||||
- **24% of screened CVs** fail verification (Reed Screening, 2025)
|
||||
- **AI-generated fraud emerging:** Deepfakes, synthetic identities, proxy interviews now feasible
|
||||
- **Regulatory risk:** Companies failing due diligence face legal liability in regulated sectors
|
||||
|
||||
**Traditional Pre-Employment Screening is Broken:**
|
||||
- Manual background checks take 5-10 days
|
||||
- Education verification requires contacting universities individually (10 days+)
|
||||
- Professional registration checks vary by profession with no central access
|
||||
- No integrated view across employment, education, and professional credentials
|
||||
|
||||
---
|
||||
|
||||
## Market Size & Addressable Opportunity
|
||||
|
||||
### TAM (Total Addressable Market)
|
||||
|
||||
**UK Recruitment Market Segment:**
|
||||
- **190,000 recruitment companies** in UK (2024)
|
||||
- **~3,500+ recruiting via dedicated screening tools**
|
||||
- **Estimated £2.8B spent on background screening annually**
|
||||
|
||||
### SAM (Serviceable Addressable Market)
|
||||
|
||||
**TrueCV Target Segment:**
|
||||
- Mid-market recruitment agencies (50-500 staff): ~800 companies
|
||||
- Corporate HR departments (100+ employees): ~15,000 companies
|
||||
- Specialist vertical recruiters (healthcare, finance, legal): ~2,500 companies
|
||||
- **Total SAM:** ~18,300 potential customers
|
||||
|
||||
**Estimated SAM value at £180/customer/year:** ~£3.3M annually
|
||||
|
||||
### SOM (Serviceable Obtainable Market) - Year 1
|
||||
|
||||
- **Target:** 50-100 customers at £50-200/month (various tiers)
|
||||
- **Projected revenue:** £30-240K in Year 1
|
||||
- **Growth trajectory:** Doubling annually if market adoption strong
|
||||
|
||||
---
|
||||
|
||||
## Competitive Landscape
|
||||
|
||||
### Current Competitors
|
||||
|
||||
| Competitor | Coverage | Strength | Weakness |
|
||||
|---|---|---|---|
|
||||
| **Workable** | ATS + basic screening | Broad platform | No CV verification focus |
|
||||
| **Deel** | Global hiring + screening | Compliance authority | Not UK-focused; expensive |
|
||||
| **Checkr** | Background checks + DBS | Scale and integrations | No CV-specific verification |
|
||||
| **Verifile** | Pre-employment screening | Established relationships | Traditional manual process |
|
||||
| **Veriff** | Identity verification | Strong deepfake tech | Not employment-focused |
|
||||
|
||||
### TrueCV Differentiation
|
||||
|
||||
| Feature | TrueCV | Workable | Deel | Checkr | Verifile |
|
||||
|---|---|---|---|---|---|
|
||||
| **Degree Verification (HEDD)** | ✅ Q1 2026 | ❌ | ❌ | ❌ | ❌ |
|
||||
| **Healthcare Register Checks** | ✅ Q1 2026 | ❌ | ❌ | ❌ | ❌ |
|
||||
| **Timeline Fraud Detection** | ✅ Q1 2026 | ❌ | ❌ | ❌ | ❌ |
|
||||
| **Director Verification** | ✅ Q1 2026 | ❌ | ❌ | ❌ | ❌ |
|
||||
| **Companies House API** | ✅ | ❌ | ❌ | ❌ | ❌ |
|
||||
| **Professional Bodies** | ✅ Q2 2026 | ❌ | ❌ | Partial | Partial |
|
||||
| **DBS Integration** | ✅ Q3 2026 | ❌ | ✅ | ✅ | ✅ |
|
||||
|
||||
**Key Advantage:** *First-to-market with CV-specific, UK-integrated verification stack*
|
||||
|
||||
---
|
||||
|
||||
## Product Strategy
|
||||
|
||||
### Phase 1 (Q1 2026): MVP Launch - "The Verified CV"
|
||||
|
||||
**Positioning:** "Every UK degree verified. Every timeline verified. Every claim validated."
|
||||
|
||||
**Core Features (8 weeks):**
|
||||
1. HEDD degree verification (real-time + manual review tracking)
|
||||
2. Timeline fraud detection (overlaps, gaps, education-employment sequencing)
|
||||
3. Companies House director verification
|
||||
4. GMC/NMC healthcare register checks
|
||||
5. Enhanced CV parsing (education/employment entity linking)
|
||||
|
||||
**Target Customer:** Medium recruitment agencies (50-200 hires/year)
|
||||
|
||||
**Pricing Model:**
|
||||
- **Freemium:** 3 free CV checks/month (Companies House + timeline)
|
||||
- **Professional:** £49/month - Unlimited checks + HEDD verification
|
||||
- **Enterprise:** £199/month - Pro features + API access + custom integrations
|
||||
|
||||
**Launch Strategy:**
|
||||
- Partner with 3-5 recruitment agencies for beta testing (Week 2-4)
|
||||
- Launch public beta (Week 5)
|
||||
- GA release (Week 8)
|
||||
- Press/analyst outreach highlighting fraud prevention angle
|
||||
|
||||
**Success Metrics:**
|
||||
- 500+ signups in first 4 weeks
|
||||
- 10%+ weekly active check rate
|
||||
- 85%+ feature satisfaction (NPS >40)
|
||||
|
||||
---
|
||||
|
||||
### Phase 2 (Q2 2026): Professional Bodies Expansion
|
||||
|
||||
**Positioning:** "Verify degrees. Verify certifications. Verify everything."
|
||||
|
||||
**New Features:**
|
||||
1. ICAEW accountant registration checks
|
||||
2. SRA solicitor registration checks
|
||||
3. IET engineer registration checks
|
||||
4. RIBA architect registration checks
|
||||
5. GOV.UK regulated profession enrichment (API layer)
|
||||
|
||||
**Target Market Expansion:**
|
||||
- Financial services recruiting
|
||||
- Legal recruiting
|
||||
- Engineering recruiting
|
||||
- Niche vertical specialists
|
||||
|
||||
**Business Impact:**
|
||||
- +40% monthly active users
|
||||
- +3x engagement (more verifications per customer)
|
||||
- +2x ARPU (professional tier premium)
|
||||
|
||||
**Pricing:** Professional tier → £79/month; Enterprise → £249/month
|
||||
|
||||
---
|
||||
|
||||
### Phase 3 (Q3 2026): Compliance & Regulatory
|
||||
|
||||
**Positioning:** "Full employment verification. Complete compliance confidence."
|
||||
|
||||
**New Features:**
|
||||
1. HMRC payroll verification (partnership model)
|
||||
2. DBS check integration (partnership + commission)
|
||||
3. Right-to-Work verification API
|
||||
4. Audit trail & compliance reporting
|
||||
5. Batch processing API
|
||||
|
||||
**Target Markets:**
|
||||
- Large corporate HR departments
|
||||
- Pre-employment screening agencies
|
||||
- Temp/staffing agencies (compliance-heavy)
|
||||
|
||||
**Business Model Evolution:**
|
||||
- Per-check commission on DBS (£5-15 per check)
|
||||
- HMRC verification licensing (custom pricing)
|
||||
- API/platform access (£500-2,000/month)
|
||||
|
||||
---
|
||||
|
||||
## Go-To-Market Strategy
|
||||
|
||||
### Sales Channels
|
||||
|
||||
#### Channel 1: Direct Sales (Lead)
|
||||
- Target recruitment agency owners (LinkedIn outreach)
|
||||
- HR directors at 100+ employee companies
|
||||
- Sales pitch: "Reduce hiring risk. Verify every claim. In minutes."
|
||||
- Expected conversion: 5-8% from qualified leads
|
||||
- Sales cycle: 2-4 weeks
|
||||
|
||||
#### Channel 2: Partnerships
|
||||
- Integrate with ATS platforms (Workable, Bullhorn, Lever)
|
||||
- White-label for existing background check providers
|
||||
- API marketplace (Zapier, Make, etc.)
|
||||
- Expected impact: +30% user acquisition annually
|
||||
|
||||
#### Channel 3: Content & SEO
|
||||
- Blog: "UK CV Fraud Patterns" (targeting "CV verification UK" search)
|
||||
- Case studies: "How we caught 18 fake degrees in Q1"
|
||||
- Thought leadership: Webinars on fraud detection for HR
|
||||
- Expected impact: +20% organic users
|
||||
|
||||
#### Channel 4: Vertical Specialists
|
||||
- Healthcare recruiter outreach (GMC/NMC checks as entry)
|
||||
- Financial services (ICAEW verification)
|
||||
- Legal recruiting (SRA verification)
|
||||
- Expected impact: +25% high-value customers
|
||||
|
||||
### Marketing Messaging
|
||||
|
||||
**Tagline:** "Hire with Confidence. Verify with TrueCV."
|
||||
|
||||
**Core Messages:**
|
||||
1. **For Recruiters:** "Catch 90% of degree fraud in seconds. One-click HEDD verification."
|
||||
2. **For HR Teams:** "Complete CV validation pipeline. Reduce hiring risk by 70%."
|
||||
3. **For Compliance:** "Full audit trail. DBS integration. Regulatory confidence."
|
||||
|
||||
**Proof Points:**
|
||||
- "Trusted by 5+ UK recruitment agencies in first 30 days"
|
||||
- "1 in 5 candidates have false degrees — we find them"
|
||||
- "Average savings: £8,000 per bad hire prevented"
|
||||
|
||||
---
|
||||
|
||||
## Pricing Strategy
|
||||
|
||||
### Tier Analysis
|
||||
|
||||
| Tier | Users | Monthly | Annual | Features |
|
||||
|---|---|---|---|---|
|
||||
| **Free** | Solo recruiters | £0 | £0 | 3 CV checks, Companies House |
|
||||
| **Professional** | Small agencies | £49 | £490 | Unlimited checks, HEDD, Timeline |
|
||||
| **Enterprise** | Large orgs | £199 | £1,990 | API access, custom integrations, DBS |
|
||||
| **API/Platform** | Integration partners | £500-2K | £6-24K | Batch processing, white-label |
|
||||
|
||||
### Unit Economics (Target - Year 2)
|
||||
|
||||
- **Customer Acquisition Cost (CAC):** £150-300 (organic/partner-led)
|
||||
- **Average Revenue Per User (ARPU):** £60-120/month (mix of tiers)
|
||||
- **Payback Period:** 2-4 months
|
||||
- **Gross Margin:** 75-80% (SaaS model)
|
||||
- **LTV:CAC Ratio:** 4:1+ (healthy SaaS)
|
||||
|
||||
---
|
||||
|
||||
## Organizational Requirements
|
||||
|
||||
### Team Structure (12-month horizon)
|
||||
|
||||
**Now (Q1):**
|
||||
- 2 Backend Engineers (full-time on Phase 1)
|
||||
- 1 QA Engineer
|
||||
- 1 Product Manager
|
||||
- 1 Marketing/Growth Lead
|
||||
|
||||
**Q2 Addition:**
|
||||
- +1 Full-stack Engineer (vertical expansion)
|
||||
- +1 Sales/BD Lead (partnership development)
|
||||
|
||||
**Q3 Addition:**
|
||||
- +1 Customer Success Manager (onboarding)
|
||||
- +1 Part-time Data Analyst (metrics/LTV)
|
||||
|
||||
---
|
||||
|
||||
## Key Risks & Mitigations
|
||||
|
||||
| Risk | Probability | Impact | Mitigation |
|
||||
|---|---|---|---|
|
||||
| **HEDD API access delayed** | Medium | High | Use web portal integration; request API access in parallel |
|
||||
| **NHS/GMC scraping blocked** | Low | Medium | Request official API access proactively; provide value-add |
|
||||
| **Regulatory gatekeeping** | Medium | Medium | Build partnerships early; engage with regulators directly |
|
||||
| **DBS/HMRC integration delays** | Medium | Medium | Partner with established vendors (Verifile, DDC) handling compliance |
|
||||
| **Market adoption slower than expected** | Medium | Medium | Focus on high-value verticals first (healthcare, finance); expand TAM gradually |
|
||||
| **Competitor response** | Medium | Medium | Maintain first-mover advantage; deepen integrations; expand internationally (Ireland, Australia next) |
|
||||
|
||||
---
|
||||
|
||||
## Success Metrics (12-Month Goals)
|
||||
|
||||
### Business Metrics
|
||||
- **Revenue:** £250K+ annualized (Mix of Professional/Enterprise)
|
||||
- **Customers:** 50-75 paying customers
|
||||
- **Monthly Recurring Revenue (MRR):** £20K+
|
||||
- **CAC Payback:** <4 months
|
||||
- **NPS:** >50 (positive)
|
||||
|
||||
### Product Metrics
|
||||
- **HEDD Verification Accuracy:** >98% match rate
|
||||
- **Timeline Detection Rate:** 85%+ of actual gaps/overlaps caught
|
||||
- **Directorship Verification:** 95%+ accuracy (vs. Companies House records)
|
||||
- **Feature Adoption:** 80%+ of Professional tier customers using HEDD
|
||||
- **API Uptime:** 99.9%
|
||||
|
||||
### Market Metrics
|
||||
- **Brand Awareness:** 15%+ of recruitment agencies aware of TrueCV
|
||||
- **Market Share:** 0.5-1% of addressable recruitment screening market
|
||||
- **Vertical Penetration:** 3%+ of healthcare recruiters, 2%+ financial recruiters
|
||||
|
||||
---
|
||||
|
||||
## Financial Projections
|
||||
|
||||
### Conservative Scenario (50 customers by end-of-year)
|
||||
|
||||
**Revenue Breakdown:**
|
||||
- 30 × Professional tier at £49/mo: £1,470/mo
|
||||
- 15 × Enterprise tier at £199/mo: £2,985/mo
|
||||
- 5 × API/Platform at £1,000/mo: £5,000/mo
|
||||
- **Total MRR (Dec 2026):** £9,455
|
||||
- **Annualized:** £113,460
|
||||
|
||||
**Costs:**
|
||||
- Engineering (2 FTE): £150K/year
|
||||
- Infrastructure/APIs: £20K/year
|
||||
- Sales/Marketing: £30K/year
|
||||
- Operations: £20K/year
|
||||
- **Total Cost:** £220K/year
|
||||
|
||||
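**Result:** At this mix (~£189 MRR per customer), annualized revenue of ~£113K covers about half of the £220K cost base; break-even needs roughly 97 customers at the same mix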
|
||||
|
||||
### Growth Scenario (100 customers by end-of-year)
|
||||
|
||||
- **MRR (Dec 2026):** £18,910
|
||||
- **Annualized Revenue:** £226,920
|
||||
- **Gross Margin:** 75% = £170K+ gross profit
|
||||
|
||||
---
|
||||
|
||||
## Next 30 Days Action Plan
|
||||
|
||||
### Week 1-2: Preparation
|
||||
- [ ] Contact HEDD for API access / partner discussions
|
||||
- [ ] Reach out to GMC/NMC about verification APIs
|
||||
- [ ] Identify 5 recruitment agency beta partners
|
||||
- [ ] Finalize HEDD compliance & consent workflows
|
||||
|
||||
### Week 2-4: Development
|
||||
- [ ] Complete HEDD integration (see Phase 1 technical doc)
|
||||
- [ ] GMC/NMC scraper development
|
||||
- [ ] Enhanced timeline analysis
|
||||
- [ ] Companies House director verification
|
||||
|
||||
### Week 3-4: Beta & Validation
|
||||
- [ ] Beta launch with 3-5 agencies
|
||||
- [ ] Collect feedback on UX/value
|
||||
- [ ] Measure fraud detection accuracy
|
||||
- [ ] Iterate on flag messaging/severity
|
||||
|
||||
### Week 4+: Go-to-Market
|
||||
- [ ] Public launch announcement
|
||||
- [ ] Initial outreach to 20-30 qualified prospects
|
||||
- [ ] Content marketing (first blog post live)
|
||||
- [ ] Track signup rate & activation
|
||||
|
||||
---
|
||||
|
||||
## Long-Term Vision (2-3 Years)
|
||||
|
||||
**Expansion Opportunities Beyond UK:**
|
||||
|
||||
### Ireland (Natural Extension)
|
||||
- Similar legal framework to UK
|
||||
- HEDD equivalent exists (HEA)
|
||||
- Revenue opportunity: +£50-100K annually
|
||||
|
||||
### Australia/New Zealand
|
||||
- English-speaking markets
|
||||
- Similar professional regulation frameworks
|
||||
- Revenue opportunity: +£150-300K annually
|
||||
|
||||
### EU Markets (Longer-term)
|
||||
- Different regulatory landscape (more complex)
|
||||
- ENIC-NARIC degree verification network
|
||||
- Professional body registration varies by country
|
||||
|
||||
### Vertical Integrations
|
||||
- HR software integrations (Workday, SAP SuccessFactors)
|
||||
- Talent acquisition platforms (multi-tool suites)
|
||||
- Compliance software (audit logging, reporting)
|
||||
|
||||
---
|
||||
|
||||
## Conclusion
|
||||
|
||||
TrueCV addresses a massive UK market problem (£4.2B+ annual cost from CV fraud) with a focused, integrated solution. By launching with HEDD degree verification + timeline fraud detection in Q1 2026, we capture first-mover advantage in a gap no competitor fills.
|
||||
|
||||
**The opportunity:** Become the UK's trusted CV verification layer for recruitment, reducing fraud while accelerating hiring processes.
|
||||
|
||||
**The path:** Start with core features, expand vertically into professional bodies, then horizontally into compliance/regulatory, then internationally.
|
||||
|
||||
**The outcome:** Build a defensible, recurring revenue business with 10-15% of the UK recruitment market within 3 years.
|
||||
|
||||
---
|
||||
|
||||
## Appendix: Customer Personas
|
||||
|
||||
### Persona 1: Agency Owner (Mid-Market)
|
||||
- **Name:** Sarah, 48, runs recruitment agency (80 staff)
|
||||
- **Problem:** Wasting 2-3 hours per hire verifying degrees manually
|
||||
- **Budget:** £3K-8K/year on screening tools
|
||||
- **Decision-making:** Speed & cost focus; wants manual verification eliminated
|
||||
- **Buying signal:** "Can you reduce our verification time from 5 days to 5 minutes?"
|
||||
|
||||
### Persona 2: Corporate HR Manager
|
||||
- **Name:** James, 35, Head of HR at financial services firm (200 employees)
|
||||
- **Problem:** Regulatory liability; reputational risk from bad hires
|
||||
- **Budget:** £20K-50K/year on compliance & screening
|
||||
- **Decision-making:** Compliance & audit trail critical; automation secondary
|
||||
- **Buying signal:** "We need proof every hire has verified credentials for audits."
|
||||
|
||||
### Persona 3: Specialist Vertical Recruiter
|
||||
- **Name:** Dr. Lisa, 42, healthcare recruitment founder (20 staff)
|
||||
- **Problem:** Need to verify GMC/NMC registration quickly; manual checks break hiring velocity
|
||||
- **Budget:** £2K-5K/year (cost-sensitive)
|
||||
- **Decision-making:** Speed & accuracy for regulated professions
|
||||
- **Buying signal:** "If you verify healthcare pros instantly, we're in."
|
||||
|
||||
---
|
||||
|
||||
## References & Data Sources
|
||||
|
||||
- [CIFAS CV Fraud Report](https://www.cifas.org.uk/newsroom/1-in-5-lie-about-uni-degree-cv-fraud)
|
||||
- [Reed Screening CV Verification Data](https://www.reed.com/)
|
||||
- [UK Employment Gap Report 2025](https://www.livecareer.co.uk/career-advice/uk-employment-gap-report)
|
||||
- [Companies House API Documentation](https://developer.companieshouse.gov.uk/)
|
||||
- [HEDD (Higher Education Degree Datacheck)](https://hedd.ac.uk/)
|
||||
- [GMC Register](https://www.gmc-uk.org/registration-and-licensing/our-registers)
|
||||
- [NMC Register](https://www.nmc.org.uk/registration/search-the-register/)
|
||||
|
||||
161
deploy/README.md
@@ -1,161 +0,0 @@
|
||||
# TrueCV Deployment Guide
|
||||
|
||||
## Quick Start
|
||||
|
||||
### 1. Server Setup (run once on fresh Ubuntu server)
|
||||
|
||||
```bash
|
||||
# Copy server-setup.sh to your server
|
||||
scp deploy/server-setup.sh user@your-server:/tmp/
|
||||
|
||||
# SSH into server and run setup
|
||||
ssh user@your-server
|
||||
sudo bash /tmp/server-setup.sh
|
||||
```
|
||||
|
||||
**Before running**, edit the script and update:
|
||||
- `DOMAIN` - Your domain name
|
||||
- `DB_PASSWORD` - Strong password for SQL Server
|
||||
- `ADMIN_EMAIL` - Email for SSL certificate notifications
|
||||
|
||||
### 2. Deploy Application (run from dev machine)
|
||||
|
||||
```bash
|
||||
# Edit deploy.sh and update configuration
|
||||
nano deploy/deploy.sh
|
||||
|
||||
# Make executable and run
|
||||
chmod +x deploy/deploy.sh
|
||||
./deploy/deploy.sh
|
||||
```
|
||||
|
||||
**Update these values in deploy.sh:**
|
||||
- `SERVER_USER` - SSH username
|
||||
- `SERVER_HOST` - Server hostname or IP
|
||||
- `DOMAIN` - Your domain name
|
||||
|
||||
### 3. Enable SSL
|
||||
|
||||
After DNS is configured and app is deployed:
|
||||
|
||||
```bash
|
||||
ssh user@your-server
|
||||
sudo certbot --nginx -d truecv.yourdomain.com
|
||||
```
|
||||
|
||||
## Configuration
|
||||
|
||||
### Environment Variables
|
||||
|
||||
The systemd service sets these environment variables:
|
||||
- `ASPNETCORE_ENVIRONMENT=Production`
|
||||
- `ASPNETCORE_URLS=http://localhost:5000`
|
||||
- `ConnectionStrings__DefaultConnection=...`
|
||||
|
||||
To add more (like API keys), edit:
|
||||
```bash
|
||||
sudo systemctl edit truecv
|
||||
```
|
||||
|
||||
Add:
|
||||
```ini
|
||||
[Service]
|
||||
Environment=OpenAI__ApiKey=your-key-here
|
||||
```
|
||||
|
||||
### appsettings.Production.json
|
||||
|
||||
For sensitive settings, create `/var/www/truecv/appsettings.Production.json`:
|
||||
|
||||
```json
|
||||
{
|
||||
"ConnectionStrings": {
|
||||
"DefaultConnection": "Server=127.0.0.1;Database=TrueCV;User Id=SA;Password=YourPassword;TrustServerCertificate=True"
|
||||
},
|
||||
"OpenAI": {
|
||||
"ApiKey": "your-openai-key"
|
||||
}
|
||||
}
|
||||
```
|
||||
|
||||
## Maintenance
|
||||
|
||||
### View Logs
|
||||
```bash
|
||||
# Application logs
|
||||
sudo journalctl -u truecv -f
|
||||
|
||||
# Nginx logs
|
||||
sudo tail -f /var/log/nginx/access.log
|
||||
sudo tail -f /var/log/nginx/error.log
|
||||
|
||||
# SQL Server logs
|
||||
docker logs truecv-sql -f
|
||||
```
|
||||
|
||||
### Restart Services
|
||||
```bash
|
||||
sudo systemctl restart truecv
|
||||
sudo systemctl restart nginx
|
||||
docker restart truecv-sql
|
||||
```
|
||||
|
||||
### Database Backup
|
||||
```bash
|
||||
# Backup
|
||||
docker exec truecv-sql /opt/mssql-tools18/bin/sqlcmd \
|
||||
-S localhost -U SA -P 'YourPassword' -C \
|
||||
-Q "BACKUP DATABASE TrueCV TO DISK='/var/opt/mssql/backup/truecv.bak'"
|
||||
|
||||
# Copy backup from container
|
||||
docker cp truecv-sql:/var/opt/mssql/backup/truecv.bak ./truecv-backup.bak
|
||||
```
|
||||
|
||||
### Rollback Deployment
|
||||
```bash
|
||||
# On server - restore previous version
|
||||
sudo systemctl stop truecv
|
||||
sudo rm -rf /var/www/truecv
|
||||
sudo mv /var/www/truecv.backup.YYYYMMDD_HHMMSS /var/www/truecv
|
||||
sudo systemctl start truecv
|
||||
```
|
||||
|
||||
## Troubleshooting
|
||||
|
||||
### App won't start
|
||||
```bash
|
||||
# Check status
|
||||
sudo systemctl status truecv
|
||||
|
||||
# Check logs
|
||||
sudo journalctl -u truecv -n 100
|
||||
|
||||
# Test manually
|
||||
cd /var/www/truecv
|
||||
sudo -u www-data dotnet TrueCV.Web.dll
|
||||
```
|
||||
|
||||
### Database connection issues
|
||||
```bash
|
||||
# Check SQL Server is running
|
||||
docker ps | grep truecv-sql
|
||||
|
||||
# Test connection
|
||||
docker exec -it truecv-sql /opt/mssql-tools18/bin/sqlcmd \
|
||||
-S localhost -U SA -P 'YourPassword' -C \
|
||||
-Q "SELECT name FROM sys.databases"
|
||||
```
|
||||
|
||||
### Blazor SignalR issues
|
||||
Ensure Nginx is configured for WebSocket support (included in setup script).
|
||||
|
||||
Check browser console for connection errors.
|
||||
|
||||
## Security Checklist
|
||||
|
||||
- [ ] Change default SQL Server password
|
||||
- [ ] Enable SSL with Let's Encrypt
|
||||
- [ ] Configure firewall (UFW)
|
||||
- [ ] Set up automated backups
|
||||
- [ ] Enable fail2ban for SSH protection
|
||||
- [ ] Keep system updated regularly
|
||||
|
Before Width: | Height: | Size: 254 MiB |
|
Before Width: | Height: | Size: 254 MiB |
|
Before Width: | Height: | Size: 7.9 MiB |
|
Before Width: | Height: | Size: 254 MiB |
|
Before Width: | Height: | Size: 7.9 MiB |
|
Before Width: | Height: | Size: 254 MiB |
448
src/RealCV.Application/Data/UKHistoricalEmployers.cs
Normal file
@@ -0,0 +1,448 @@
|
||||
namespace RealCV.Application.Data;
|
||||
|
||||
/// <summary>
|
||||
/// Database of historical UK employers that may no longer exist under their original names.
|
||||
/// Includes companies that were acquired, merged, dissolved, or renamed.
|
||||
/// Also includes public sector bodies and internal divisions of larger organisations.
|
||||
/// </summary>
|
||||
public static class UKHistoricalEmployers
|
||||
{
|
||||
/// <summary>
|
||||
/// Maps historical company names to their current/successor company information.
|
||||
/// Key: Historical name (case-insensitive)
|
||||
/// Value: HistoricalEmployerInfo with successor details
|
||||
/// </summary>
|
||||
public static readonly Dictionary<string, HistoricalEmployerInfo> HistoricalCompanies =
|
||||
new(StringComparer.OrdinalIgnoreCase)
|
||||
{
|
||||
// Engineering & Construction
|
||||
["Foster Wheeler"] = new("Wood Group / AMEC Foster Wheeler", "Engineering contractor acquired by AMEC in 2014, now part of Wood Group", "00163609"),
|
||||
["Foster Wheeler Ltd"] = new("Wood Group / AMEC Foster Wheeler", "Engineering contractor acquired by AMEC in 2014, now part of Wood Group", "00163609"),
|
||||
["Foster Wheeler Limited"] = new("Wood Group / AMEC Foster Wheeler", "Engineering contractor acquired by AMEC in 2014, now part of Wood Group", "00163609"),
|
||||
["Foster Wheeler PLC"] = new("Wood Group / AMEC Foster Wheeler", "Engineering contractor acquired by AMEC in 2014, now part of Wood Group", "00163609"),
|
||||
["Sir Alexander Gibb and Partners"] = new("Jacobs Engineering", "Historic engineering consultancy (founded 1922), acquired by Jacobs", null),
|
||||
["Alexander Gibb and Partners"] = new("Jacobs Engineering", "Historic engineering consultancy (founded 1922), acquired by Jacobs", null),
|
||||
["Gibb and Partners"] = new("Jacobs Engineering", "Historic engineering consultancy, acquired by Jacobs", null),
|
||||
["Mott MacDonald"] = new("Mott MacDonald", "Still trading - major engineering consultancy", "01243967"),
|
||||
["Ove Arup"] = new("Arup", "Still trading as Arup", "01312453"),
|
||||
["Arup"] = new("Arup", "Major engineering consultancy", "01312453"),
|
||||
["WS Atkins"] = new("SNC-Lavalin / Atkins", "Acquired by SNC-Lavalin in 2017", "01885586"),
|
||||
["Atkins"] = new("SNC-Lavalin / Atkins", "Acquired by SNC-Lavalin in 2017", "01885586"),
|
||||
|
||||
// Pharmaceuticals
|
||||
["Glaxo"] = new("GlaxoSmithKline (GSK)", "Merged with SmithKline Beecham in 2000 to form GSK", "03888792"),
|
||||
["Glaxo Research & Development"] = new("GlaxoSmithKline (GSK)", "Glaxo R&D subsidiary, merged into GSK in 2000", "03888792"),
|
||||
["Glaxo Research & Development Ltd"] = new("GlaxoSmithKline (GSK)", "Glaxo R&D subsidiary, merged into GSK in 2000", "03888792"),
|
||||
["Glaxo Research and Development"] = new("GlaxoSmithKline (GSK)", "Glaxo R&D subsidiary, merged into GSK in 2000", "03888792"),
|
||||
["Glaxo Wellcome"] = new("GlaxoSmithKline (GSK)", "Formed 1995 (Glaxo + Wellcome), merged with SmithKline Beecham 2000", "03888792"),
|
||||
["SmithKline Beecham"] = new("GlaxoSmithKline (GSK)", "Merged with Glaxo Wellcome in 2000 to form GSK", "03888792"),
|
||||
["Beecham"] = new("GlaxoSmithKline (GSK)", "Merged to form SmithKline Beecham, then GSK", "03888792"),
|
||||
["Wellcome"] = new("GlaxoSmithKline (GSK)", "Acquired by Glaxo in 1995", "03888792"),
|
||||
["ICI Pharmaceuticals"] = new("AstraZeneca", "ICI pharma division became Zeneca, merged with Astra 1999", "02723534"),
|
||||
["Zeneca"] = new("AstraZeneca", "Merged with Astra in 1999", "02723534"),
|
||||
|
||||
// Banking & Finance (historical names)
|
||||
["Midland Bank"] = new("HSBC UK", "Acquired by HSBC in 1992", "00014259"),
|
||||
["National Westminster Bank"] = new("NatWest (RBS Group)", "Acquired by RBS in 2000", "00929027"),
|
||||
["NatWest"] = new("NatWest Group", "Part of NatWest Group (formerly RBS)", "00929027"),
|
||||
["Lloyds Bank"] = new("Lloyds Banking Group", "Part of Lloyds Banking Group", "00002065"),
|
||||
["Lloyds TSB"] = new("Lloyds Banking Group", "Rebranded to Lloyds Bank in 2013", "00002065"),
|
||||
["TSB"] = new("TSB Bank", "Demerged from Lloyds in 2013, acquired by Sabadell", "SC205310"),
|
||||
["Halifax"] = new("Halifax (Lloyds Banking Group)", "Part of Lloyds Banking Group since 2009", "02367076"),
|
||||
["HBOS"] = new("Lloyds Banking Group", "Acquired by Lloyds in 2009", "SC218813"),
|
||||
["Bank of Scotland"] = new("Bank of Scotland (Lloyds Banking Group)", "Part of Lloyds Banking Group", "SC327000"),
|
||||
["Abbey National"] = new("Santander UK", "Acquired by Santander in 2004", "02294747"),
|
||||
["Alliance & Leicester"] = new("Santander UK", "Acquired by Santander in 2008", "03263713"),
|
||||
["Bradford & Bingley"] = new("Santander UK (savings) / UKAR (mortgages)", "Nationalised 2008, split up", "00189520"),
|
||||
["Northern Rock"] = new("Virgin Money UK", "Nationalised 2008, sold to Virgin Money 2012", "03273685"),
|
||||
|
||||
// Retail
|
||||
["Woolworths"] = new("Dissolved", "UK Woolworths went into administration in 2008", "00106966"),
|
||||
["British Home Stores"] = new("Dissolved", "BHS went into administration in 2016", "00229606"),
|
||||
["BHS"] = new("Dissolved", "BHS went into administration in 2016", "00229606"),
|
||||
["Littlewoods"] = new("Shop Direct / The Very Group", "Stores closed, online business continued", null),
|
||||
// Company number left unset: the previous value "00abortedte" was not a valid Companies House number.
["Comet"] = new("Dissolved", "Electrical retailer went into administration in 2012", null),
|
||||
["MFI"] = new("Dissolved", "Furniture retailer went into administration in 2008", null),
|
||||
["Courts"] = new("Dissolved", "Furniture retailer ceased UK operations", null),
|
||||
["Safeway"] = new("Morrisons", "UK stores acquired by Morrisons in 2004", "00358949"),
|
||||
["Kwik Save"] = new("Dissolved", "Supermarket chain dissolved in 2007", null),
|
||||
["Fine Fare"] = new("Dissolved", "Supermarket chain - stores sold to various buyers", null),
|
||||
["Gateway"] = new("Somerfield / Co-op", "Became Somerfield, then acquired by Co-op", null),
|
||||
["Somerfield"] = new("Co-operative Group", "Acquired by Co-op in 2009", null),
|
||||
|
||||
// Telecoms
|
||||
["British Telecom"] = new("BT Group", "Rebranded to BT", "01800000"),
|
||||
["GPO Telephones"] = new("BT Group", "Became British Telecom, then BT", "01800000"),
|
||||
["Mercury Communications"] = new("Cable & Wireless / Vodafone", "Merged into Cable & Wireless, later Vodafone", null),
|
||||
["Cellnet"] = new("O2 (Virgin Media O2)", "Became BT Cellnet, then O2", null),
|
||||
["Orange"] = new("EE (BT)", "Merged with T-Mobile to form EE, acquired by BT", null),
|
||||
["T-Mobile UK"] = new("EE (BT)", "Merged with Orange to form EE", null),
|
||||
["One2One"] = new("EE (BT)", "Became T-Mobile UK, then EE", null),
|
||||
|
||||
// Utilities
|
||||
["Central Electricity Generating Board"] = new("National Grid / Various generators", "CEGB privatised and split in 1990", null),
|
||||
["CEGB"] = new("National Grid / Various generators", "CEGB privatised and split in 1990", null),
|
||||
["British Gas"] = new("Centrica / National Grid", "Demerged in 1997", "00029782"),
|
||||
["Eastern Electricity"] = new("EDF Energy", "Privatised, now part of EDF", null),
|
||||
["London Electricity"] = new("EDF Energy", "Privatised, now part of EDF", null),
|
||||
["SEEBOARD"] = new("EDF Energy", "Privatised, now part of EDF", null),
|
||||
["PowerGen"] = new("E.ON UK", "Acquired by E.ON", null),
|
||||
["National Power"] = new("RWE npower / Innogy", "Split and acquired", null),
|
||||
|
||||
// Manufacturing & Industrial
|
||||
["British Steel"] = new("Tata Steel UK / British Steel (2016)", "Privatised, acquired by Corus then Tata, British Steel name revived 2016", "12303256"),
|
||||
["British Steel Corporation"] = new("Tata Steel UK / British Steel (2016)", "Nationalised steel industry, privatised 1988", "12303256"),
|
||||
["British Steel plc"] = new("Tata Steel UK / British Steel (2016)", "Merged with Hoogovens to form Corus 1999", "12303256"),
|
||||
["Corus"] = new("Tata Steel UK", "Acquired by Tata Steel in 2007", null),
|
||||
["British Leyland"] = new("Various (BMW, Tata, etc.)", "Split up - brands went to various owners", null),
|
||||
["Rover Group"] = new("Dissolved", "Final owner MG Rover went bankrupt 2005", null),
|
||||
["MG Rover"] = new("Dissolved", "Went into administration in 2005", null),
|
||||
["Austin Rover"] = new("Dissolved", "Part of British Leyland, became Rover Group", null),
|
||||
["British Aerospace"] = new("BAE Systems", "Merged with Marconi Electronic Systems in 1999", "01470151"),
|
||||
["BAe"] = new("BAE Systems", "Merged with Marconi Electronic Systems in 1999", "01470151"),
|
||||
["Marconi"] = new("BAE Systems / Ericsson", "Defence division to BAE, telecoms to Ericsson", null),
|
||||
["GEC"] = new("Various", "General Electric Company (UK) - broken up", null),
|
||||
["GEC Marconi"] = new("BAE Systems", "Defence business became part of BAE Systems", "01470151"),
|
||||
["Plessey"] = new("Siemens / various", "Broken up in 1989", null),
|
||||
["ICL"] = new("Fujitsu", "Acquired by Fujitsu", null),
|
||||
["International Computers Limited"] = new("Fujitsu", "Acquired by Fujitsu in 2002", null),
|
||||
["Ferranti"] = new("Dissolved", "Collapsed in 1993 after fraud scandal", null),
|
||||
|
||||
// Oil & Gas
|
||||
["British Petroleum"] = new("BP", "Rebranded to BP", "00102498"),
|
||||
["BP Amoco"] = new("BP", "Merged 1998, rebranded to just BP", "00102498"),
|
||||
["Enterprise Oil"] = new("Shell", "Acquired by Shell in 2002", null),
|
||||
["Lasmo"] = new("Eni", "Acquired by Eni in 2001", null),
|
||||
["Britoil"] = new("BP", "Acquired by BP in 1988", null),
|
||||
|
||||
// Transport
|
||||
["British Rail"] = new("Various (Network Rail, TOCs)", "Privatised and split in 1990s", null),
|
||||
["British Railways"] = new("Various (Network Rail, TOCs)", "Became British Rail, then privatised", null),
|
||||
["Railtrack"] = new("Network Rail", "Replaced by Network Rail in 2002", "04402220"),
|
||||
["British Airways"] = new("British Airways (IAG)", "Now part of International Airlines Group", "01777777"),
|
||||
["British Caledonian"] = new("British Airways", "Acquired by BA in 1987", null),
|
||||
["British European Airways"] = new("British Airways", "Merged with BOAC to form BA in 1974", null),
|
||||
["BEA"] = new("British Airways", "Merged with BOAC to form BA in 1974", null),
|
||||
["BOAC"] = new("British Airways", "Merged with BEA to form BA in 1974", null),
|
||||
["British Overseas Airways Corporation"] = new("British Airways", "Merged with BEA to form BA in 1974", null),
|
||||
["Dan-Air"] = new("British Airways", "Acquired by BA in 1992", null),
|
||||
|
||||
// Media
|
||||
["Thames Television"] = new("Fremantle", "Lost franchise 1991, production continued", null),
|
||||
["Granada Television"] = new("ITV plc", "Merged to form ITV plc", "04967001"),
|
||||
["Carlton Television"] = new("ITV plc", "Merged with Granada to form ITV", "04967001"),
|
||||
["Yorkshire Television"] = new("ITV plc", "Part of ITV plc", "04967001"),
|
||||
["Tyne Tees Television"] = new("ITV plc", "Part of ITV plc", "04967001"),
|
||||
["Central Television"] = new("ITV plc", "Part of ITV plc", "04967001"),
|
||||
["Anglia Television"] = new("ITV plc", "Part of ITV plc", "04967001"),
|
||||
["HTV"] = new("ITV plc", "Part of ITV plc", "04967001"),
|
||||
["LWT"] = new("ITV plc", "London Weekend Television, part of ITV", "04967001"),
|
||||
["London Weekend Television"] = new("ITV plc", "Part of ITV plc", "04967001"),
|
||||
|
||||
// Construction
|
||||
["Wimpey"] = new("Taylor Wimpey", "Merged with Taylor Woodrow in 2007", "00296805"),
|
||||
["Taylor Woodrow"] = new("Taylor Wimpey", "Merged with Wimpey in 2007", "00296805"),
|
||||
["John Laing"] = new("John Laing Group (infrastructure)", "Construction sold, now infrastructure investor", "05975300"),
|
||||
["Costain Group"] = new("Costain", "Still trading", "00102921"),
|
||||
["Tarmac"] = new("Tarmac (CRH)", "Construction now part of CRH", null),
|
||||
["Alfred McAlpine"] = new("Carillion (dissolved)", "Acquired by Carillion, which collapsed 2018", null),
|
||||
["Carillion"] = new("Dissolved", "Collapsed into liquidation in 2018", "03782379"),
|
||||
["Mowlem"] = new("Carillion (dissolved)", "Acquired by Carillion in 2006", null),
|
||||
["Balfour Beatty"] = new("Balfour Beatty", "Still trading", "00395826"),
|
||||
|
||||
// Insurance
|
||||
["Royal Insurance"] = new("RSA Insurance Group", "Merged with Sun Alliance", "02339826"),
|
||||
["Sun Alliance"] = new("RSA Insurance Group", "Merged with Royal Insurance", "02339826"),
|
||||
["Guardian Royal Exchange"] = new("AXA", "Acquired by AXA in 1999", null),
|
||||
["Commercial Union"] = new("Aviva", "Merged to form CGU, then Aviva", "02468686"),
|
||||
["General Accident"] = new("Aviva", "Merged to form CGU, then Aviva", "02468686"),
|
||||
["CGU"] = new("Aviva", "Rebranded to Aviva in 2002", "02468686"),
|
||||
["Norwich Union"] = new("Aviva", "Rebranded to Aviva in 2009", "02468686"),
|
||||
["Eagle Star"] = new("Zurich", "Acquired by Zurich", null),
|
||||
["Prudential"] = new("Prudential plc / M&G", "UK business demerged as M&G plc", "01397169"),
|
||||
};
|
||||
|
||||
/// <summary>
/// Major UK charities and non-profit organisations.
/// These are legitimate employers but may not be found via standard company search.
/// Names are compared case-insensitively; each name is listed once.
/// </summary>
public static readonly HashSet<string> CharityEmployers = new(StringComparer.OrdinalIgnoreCase)
{
    // Youth organisations
    "Girlguiding",
    "Girlguiding UK",
    "Girlguiding North East England",
    "Girl Guides",
    "Scouts",
    "Scout Association",
    "Boys Brigade",
    "Girls Brigade",
    "Cadets",
    "Sea Cadets",
    "Air Cadets",
    "Army Cadets",

    // Major charities
    "British Red Cross",
    "Oxfam",
    "Save the Children",
    "NSPCC",
    "Barnardo's",
    "RSPCA",
    "RSPB",
    "National Trust",
    "Cancer Research UK",
    "British Heart Foundation",
    "Macmillan Cancer Support",
    "Marie Curie",
    "Age UK",
    "Mind",
    "Samaritans",
    "Shelter",
    "Citizens Advice",
    "Citizens Advice Bureau",
    "CAB",
    "St John Ambulance",
    "Salvation Army",
    "YMCA",
    "YWCA",

    // Religious organisations
    // ("Salvation Army" is already listed under major charities above.)
    "Church of England",
    "Catholic Church",
    "Methodist Church",
    "Baptist Church",
};
|
||||
|
||||
/// <summary>
/// Names (and name fragments such as "University of" or "County Council") of
/// public sector organisations and government bodies.
/// These are legitimate employers but not registered at Companies House.
/// Lookups against this set are case-insensitive.
/// </summary>
public static readonly HashSet<string> PublicSectorEmployers = new HashSet<string>(StringComparer.OrdinalIgnoreCase)
{
    // Emergency services and health
    "Metropolitan Police", "Metropolitan Police Service", "Metropolitan Police Engineers", "Met Police",
    "City of London Police", "British Transport Police", "Police Scotland",
    "Police Service of Northern Ireland", "PSNI",
    "London Fire Brigade", "London Ambulance Service",
    "NHS", "National Health Service",

    // Central government departments and agencies
    "HM Treasury", "Home Office", "Foreign Office",
    "Ministry of Defence", "MOD",
    "Department of Health",
    "Department for Education", "DfE",
    "Department for Work and Pensions", "DWP",
    "HMRC", "HM Revenue and Customs",
    "Cabinet Office", "DVLA", "DVSA", "Environment Agency",
    "Highways Agency", "Highways England", "National Highways",

    // Armed forces
    "British Army", "Royal Navy", "Royal Air Force", "RAF", "Royal Marines",

    // Local government (mostly fragments intended for partial matching)
    "London Borough", "County Council", "City Council", "District Council",
    "Metropolitan Borough", "Borough Council", "Town Council", "Parish Council",
    "Greater London Council", "GLC",

    // Education (fragments intended for partial matching)
    "University of", "College of", "School of",

    // Other public bodies
    "BBC", "British Broadcasting Corporation", "Channel 4",
    "Bank of England", "Royal Mail", "Post Office",
    "Transport for London", "TfL", "Network Rail",
    "Ordnance Survey", "Land Registry", "Companies House", "National Archives",
    "British Library", "British Museum", "National Gallery", "Tate",
    "Natural History Museum", "Science Museum",
    "V&A", "Victoria and Albert Museum",
};
|
||||
|
||||
/// <summary>
/// Maps the name of an internal division or department (key, case-insensitive)
/// to the name of the larger company it belongs to (value).
/// These are legitimate employer references but won't be separately registered.
/// </summary>
public static readonly Dictionary<string, string> DivisionPatterns = new Dictionary<string, string>(StringComparer.OrdinalIgnoreCase)
{
    // Airlines
    { "British Airways Technical Support", "British Airways" },
    { "BA Technical Support", "British Airways" },
    { "BA Engineering", "British Airways" },
    { "British Airways Engineering", "British Airways" },
    { "FBA - British Airways", "British Airways" },

    // Major employers with divisions
    { "BBC News", "BBC" },
    { "BBC World Service", "BBC" },
    { "BBC Studios", "BBC" },
    { "ITV News", "ITV plc" },
    { "Sky News", "Sky UK" },
    { "BT Openreach", "BT Group" },
    { "Openreach", "BT Group" },
    { "BT Research", "BT Group" },
    { "Shell Research", "Shell" },
    { "BP Research", "BP" },
    { "Rolls-Royce Aerospace", "Rolls-Royce" },
    { "Rolls-Royce Marine", "Rolls-Royce" },
    { "BAE Systems Naval Ships", "BAE Systems" },
    { "BAE Systems Submarines", "BAE Systems" },

    // Banks - divisions
    { "Barclays Investment Bank", "Barclays" },
    { "Barclays Capital", "Barclays" },
    { "HSBC Investment Bank", "HSBC" },
    { "Lloyds Commercial Banking", "Lloyds Banking Group" },
    { "NatWest Markets", "NatWest Group" },
    { "RBS Markets", "NatWest Group" },
};
|
||||
|
||||
/// <summary>
/// Reports whether <paramref name="employerName"/> (after trimming surrounding
/// whitespace) is a key in <see cref="HistoricalCompanies"/>.
/// </summary>
/// <param name="employerName">Employer name to look up; null, empty or whitespace yields <c>false</c>.</param>
/// <returns><c>true</c> when the trimmed name is a known historical company name.</returns>
public static bool IsHistoricalEmployer(string employerName) =>
    !string.IsNullOrWhiteSpace(employerName)
    && HistoricalCompanies.ContainsKey(employerName.Trim());
|
||||
|
||||
/// <summary>
/// Looks up the successor details recorded for a historical employer name.
/// </summary>
/// <param name="employerName">Employer name to look up; surrounding whitespace is ignored.</param>
/// <returns>
/// The matching <see cref="HistoricalEmployerInfo"/>, or <c>null</c> when the name is
/// null/blank or is not a key in <see cref="HistoricalCompanies"/>.
/// </returns>
public static HistoricalEmployerInfo? GetHistoricalEmployerInfo(string employerName)
{
    if (string.IsNullOrWhiteSpace(employerName))
    {
        return null;
    }

    var key = employerName.Trim();
    return HistoricalCompanies.TryGetValue(key, out var info) ? info : null;
}
|
||||
|
||||
/// <summary>
/// Check if an employer is a public sector organisation.
/// </summary>
/// <remarks>
/// An exact (case-insensitive) match against <see cref="PublicSectorEmployers"/> is tried first.
/// Otherwise the name matches when it contains any entry as a whole word or phrase, e.g.
/// "London Borough of Camden" contains "London Borough". Entries are not matched inside a
/// longer word, so "Modern Interiors Ltd" does not match "MOD" and "Tate &amp; Lyle" still
/// matches "Tate" only because "Tate" stands alone as a word.
/// </remarks>
/// <param name="employerName">Employer name as written on the CV; surrounding whitespace is ignored.</param>
/// <returns><c>true</c> when the name matches a public sector entry; <c>false</c> for null/blank input or no match.</returns>
public static bool IsPublicSectorEmployer(string employerName)
{
    if (string.IsNullOrWhiteSpace(employerName))
        return false;

    var name = employerName.Trim();

    // Direct match (O(1) fast path)
    if (PublicSectorEmployers.Contains(name))
        return true;

    // Partial match for patterns like "London Borough of X"
    foreach (var pattern in PublicSectorEmployers)
    {
        if (ContainsWholePhrase(name, pattern))
            return true;
    }

    return false;

    // True when `phrase` occurs in `text` and is not glued to a letter or digit on either side.
    static bool ContainsWholePhrase(string text, string phrase)
    {
        var searchFrom = 0;
        while (searchFrom <= text.Length - phrase.Length)
        {
            var index = text.IndexOf(phrase, searchFrom, StringComparison.OrdinalIgnoreCase);
            if (index < 0)
                return false;

            var end = index + phrase.Length;
            var startsOnBoundary = index == 0 || !char.IsLetterOrDigit(text[index - 1]);
            var endsOnBoundary = end == text.Length || !char.IsLetterOrDigit(text[end]);
            if (startsOnBoundary && endsOnBoundary)
                return true;

            // This occurrence was embedded in a longer word; keep looking further along.
            searchFrom = index + 1;
        }

        return false;
    }
}
|
||||
|
||||
/// <summary>
/// Check if an employer is a charity or non-profit organisation.
/// </summary>
/// <remarks>
/// An exact (case-insensitive) match against <see cref="CharityEmployers"/> is tried first.
/// Otherwise the name matches when it contains any entry as a whole word or phrase, e.g.
/// "Oxfam GB" contains "Oxfam". Entries are not matched inside a longer word, so
/// "Cable Installations Ltd" does not match "CAB" and "Mindshare" does not match "Mind".
/// </remarks>
/// <param name="employerName">Employer name as written on the CV; surrounding whitespace is ignored.</param>
/// <returns><c>true</c> when the name matches a charity entry; <c>false</c> for null/blank input or no match.</returns>
public static bool IsCharityEmployer(string employerName)
{
    if (string.IsNullOrWhiteSpace(employerName))
        return false;

    var name = employerName.Trim();

    // Direct match (O(1) fast path)
    if (CharityEmployers.Contains(name))
        return true;

    // Partial match on whole words/phrases only
    foreach (var pattern in CharityEmployers)
    {
        if (ContainsWholePhrase(name, pattern))
            return true;
    }

    return false;

    // True when `phrase` occurs in `text` and is not glued to a letter or digit on either side.
    static bool ContainsWholePhrase(string text, string phrase)
    {
        var searchFrom = 0;
        while (searchFrom <= text.Length - phrase.Length)
        {
            var index = text.IndexOf(phrase, searchFrom, StringComparison.OrdinalIgnoreCase);
            if (index < 0)
                return false;

            var end = index + phrase.Length;
            var startsOnBoundary = index == 0 || !char.IsLetterOrDigit(text[index - 1]);
            var endsOnBoundary = end == text.Length || !char.IsLetterOrDigit(text[end]);
            if (startsOnBoundary && endsOnBoundary)
                return true;

            // This occurrence was embedded in a longer word; keep looking further along.
            searchFrom = index + 1;
        }

        return false;
    }
}
|
||||
|
||||
/// <summary>
/// Check if an employer name is an internal division and get the parent company.
/// </summary>
/// <remarks>
/// An exact (case-insensitive) key match in <see cref="DivisionPatterns"/> is tried first.
/// Otherwise the first entry whose key occurs in the name as a whole word or phrase wins,
/// e.g. "BBC News, Salford" resolves via "BBC News". Keys are not matched inside a longer
/// word, so "Alba Engineering" does not resolve via "BA Engineering".
/// </remarks>
/// <param name="employerName">Employer name as written on the CV; surrounding whitespace is ignored.</param>
/// <returns>The parent company name, or <c>null</c> for null/blank input or when no division entry matches.</returns>
public static string? GetParentCompanyForDivision(string employerName)
{
    if (string.IsNullOrWhiteSpace(employerName))
        return null;

    var name = employerName.Trim();

    // Direct match
    if (DivisionPatterns.TryGetValue(name, out var parent))
        return parent;

    // Partial match on whole words/phrases only
    foreach (var (pattern, parentCompany) in DivisionPatterns)
    {
        if (ContainsWholePhrase(name, pattern))
            return parentCompany;
    }

    return null;

    // True when `phrase` occurs in `text` and is not glued to a letter or digit on either side.
    static bool ContainsWholePhrase(string text, string phrase)
    {
        var searchFrom = 0;
        while (searchFrom <= text.Length - phrase.Length)
        {
            var index = text.IndexOf(phrase, searchFrom, StringComparison.OrdinalIgnoreCase);
            if (index < 0)
                return false;

            var end = index + phrase.Length;
            var startsOnBoundary = index == 0 || !char.IsLetterOrDigit(text[index - 1]);
            var endsOnBoundary = end == text.Length || !char.IsLetterOrDigit(text[end]);
            if (startsOnBoundary && endsOnBoundary)
                return true;

            // This occurrence was embedded in a longer word; keep looking further along.
            searchFrom = index + 1;
        }

        return false;
    }
}
|
||||
}
|
||||
|
||||
/// <summary>
/// Describes what became of a historical employer.
/// </summary>
/// <param name="SuccessorName">Name of the current or successor organisation (or a status such as "Dissolved").</param>
/// <param name="Notes">Short free-text explanation of the name change, merger, acquisition or closure.</param>
/// <param name="CompanyNumber">Associated company registration number, or <c>null</c> when none is recorded.</param>
public sealed record HistoricalEmployerInfo(string SuccessorName, string Notes, string? CompanyNumber);
|
||||
@@ -122,6 +122,28 @@ public static class UKInstitutions
|
||||
"Wrexham University",
|
||||
"York St John University",
|
||||
|
||||
// Post-1992 Universities (former polytechnics)
|
||||
"Leeds Beckett University",
|
||||
"Birmingham City University",
|
||||
"University of Bedfordshire",
|
||||
"Anglia Ruskin University",
|
||||
"University of Central Lancashire",
|
||||
"University of West London",
|
||||
"University of Northampton",
|
||||
"University of Chichester",
|
||||
"Plymouth Marjon University",
|
||||
"Bath Spa University",
|
||||
"Solent University",
|
||||
"University of Bolton",
|
||||
"University of Cumbria",
|
||||
"University of Chester",
|
||||
"University of Gloucestershire",
|
||||
"University of Suffolk",
|
||||
"Newman University",
|
||||
"Bishop Grosseteste University",
|
||||
"Harper Adams University",
|
||||
"Royal Agricultural University",
|
||||
|
||||
// Scottish Universities
|
||||
"University of Aberdeen",
|
||||
"Abertay University",
|
||||
@@ -134,6 +156,8 @@ public static class UKInstitutions
|
||||
"Bangor University",
|
||||
"University of South Wales",
|
||||
"Wrexham Glyndwr University",
|
||||
"Wrexham University",
|
||||
"Cardiff Metropolitan University",
|
||||
|
||||
// Northern Ireland
|
||||
"Ulster University",
|
||||
@@ -304,6 +328,112 @@ public static class UKInstitutions
|
||||
["South Bank University"] = "London South Bank University",
|
||||
["LSBU"] = "London South Bank University",
|
||||
|
||||
// Historical polytechnic names (became universities in 1992)
|
||||
// These are legitimate institutions that existed under different names
|
||||
["South Bank Polytechnic"] = "London South Bank University",
|
||||
["Polytechnic of the South Bank"] = "London South Bank University",
|
||||
["Thames Polytechnic"] = "University of Greenwich",
|
||||
["Woolwich Polytechnic"] = "University of Greenwich",
|
||||
["Polytechnic of Central London"] = "University of Westminster",
|
||||
["PCL"] = "University of Westminster",
|
||||
["Polytechnic of North London"] = "London Metropolitan University",
|
||||
["City of London Polytechnic"] = "London Metropolitan University",
|
||||
["London Guildhall University"] = "London Metropolitan University",
|
||||
["University of North London"] = "London Metropolitan University",
|
||||
["Polytechnic of East London"] = "University of East London",
|
||||
["North East London Polytechnic"] = "University of East London",
|
||||
["Middlesex Polytechnic"] = "Middlesex University",
|
||||
["Hatfield Polytechnic"] = "University of Hertfordshire",
|
||||
["Sheffield Polytechnic"] = "Sheffield Hallam University",
|
||||
["Sheffield City Polytechnic"] = "Sheffield Hallam University",
|
||||
["Manchester Polytechnic"] = "Manchester Metropolitan University",
|
||||
["Leeds Polytechnic"] = "Leeds Beckett University",
|
||||
["Leeds Metropolitan University"] = "Leeds Beckett University",
|
||||
["Leicester Polytechnic"] = "De Montfort University",
|
||||
["Coventry Polytechnic"] = "Coventry University",
|
||||
["Lanchester Polytechnic"] = "Coventry University",
|
||||
["Brighton Polytechnic"] = "University of Brighton",
|
||||
["Portsmouth Polytechnic"] = "University of Portsmouth",
|
||||
["Plymouth Polytechnic"] = "University of Plymouth",
|
||||
["Polytechnic South West"] = "University of Plymouth",
|
||||
["Oxford Polytechnic"] = "Oxford Brookes University",
|
||||
["Newcastle Polytechnic"] = "Northumbria University",
|
||||
["Newcastle upon Tyne Polytechnic"] = "Northumbria University",
|
||||
["Sunderland Polytechnic"] = "University of Sunderland",
|
||||
["Teesside Polytechnic"] = "Teesside University",
|
||||
["Huddersfield Polytechnic"] = "University of Huddersfield",
|
||||
["Wolverhampton Polytechnic"] = "University of Wolverhampton",
|
||||
["Liverpool Polytechnic"] = "Liverpool John Moores University",
|
||||
["Bristol Polytechnic"] = "University of the West of England",
|
||||
["Kingston Polytechnic"] = "Kingston University",
|
||||
["Nottingham Polytechnic"] = "Nottingham Trent University",
|
||||
["Trent Polytechnic"] = "Nottingham Trent University",
|
||||
["Birmingham Polytechnic"] = "Birmingham City University",
|
||||
["City of Birmingham Polytechnic"] = "Birmingham City University",
|
||||
["University of Central England"] = "Birmingham City University",
|
||||
["UCE Birmingham"] = "Birmingham City University",
|
||||
["Staffordshire Polytechnic"] = "Staffordshire University",
|
||||
["North Staffordshire Polytechnic"] = "Staffordshire University",
|
||||
["Luton College of Higher Education"] = "University of Bedfordshire",
|
||||
["University of Luton"] = "University of Bedfordshire",
|
||||
["Anglia Polytechnic"] = "Anglia Ruskin University",
|
||||
["Anglia Polytechnic University"] = "Anglia Ruskin University",
|
||||
["APU"] = "Anglia Ruskin University",
|
||||
["Cambridgeshire College of Arts and Technology"] = "Anglia Ruskin University",
|
||||
["CCAT"] = "Anglia Ruskin University",
|
||||
["Bournemouth Polytechnic"] = "Bournemouth University",
|
||||
["Dorset Institute of Higher Education"] = "Bournemouth University",
|
||||
["Derby College of Higher Education"] = "University of Derby",
|
||||
["Derbyshire College of Higher Education"] = "University of Derby",
|
||||
["Humberside Polytechnic"] = "University of Lincoln",
|
||||
["Humberside College of Higher Education"] = "University of Lincoln",
|
||||
["University of Humberside"] = "University of Lincoln",
|
||||
["University of Lincolnshire and Humberside"] = "University of Lincoln",
|
||||
["Central Lancashire Polytechnic"] = "University of Central Lancashire",
|
||||
["Preston Polytechnic"] = "University of Central Lancashire",
|
||||
["Lancashire Polytechnic"] = "University of Central Lancashire",
|
||||
["Glamorgan Polytechnic"] = "University of South Wales",
|
||||
["Polytechnic of Wales"] = "University of South Wales",
|
||||
["University of Glamorgan"] = "University of South Wales",
|
||||
["Robert Gordon Institute of Technology"] = "Robert Gordon University",
|
||||
["RGIT"] = "Robert Gordon University",
|
||||
["Napier Polytechnic"] = "Edinburgh Napier University",
|
||||
["Napier College"] = "Edinburgh Napier University",
|
||||
["Glasgow Polytechnic"] = "Glasgow Caledonian University",
|
||||
["Queen's College Glasgow"] = "Glasgow Caledonian University",
|
||||
["Dundee Institute of Technology"] = "Abertay University",
|
||||
["Dundee College of Technology"] = "Abertay University",
|
||||
|
||||
// Other historical name changes
|
||||
["Roehampton Institute"] = "Roehampton University",
|
||||
["University of Surrey Roehampton"] = "Roehampton University",
|
||||
["Thames Valley University"] = "University of West London",
|
||||
["Polytechnic of West London"] = "University of West London",
|
||||
["Ealing College of Higher Education"] = "University of West London",
|
||||
["London College of Music and Media"] = "University of West London",
|
||||
["University College Northampton"] = "University of Northampton",
|
||||
["Nene College"] = "University of Northampton",
|
||||
["University College Worcester"] = "University of Worcester",
|
||||
["Worcester College of Higher Education"] = "University of Worcester",
|
||||
["University College Chichester"] = "University of Chichester",
|
||||
["Chichester Institute of Higher Education"] = "University of Chichester",
|
||||
["College of St Mark and St John"] = "Plymouth Marjon University",
|
||||
["Marjon"] = "Plymouth Marjon University",
|
||||
["University of St Mark and St John"] = "Plymouth Marjon University",
|
||||
["University College Falmouth"] = "Falmouth University",
|
||||
["Falmouth College of Arts"] = "Falmouth University",
|
||||
["Bath College of Higher Education"] = "Bath Spa University",
|
||||
["Bath Spa University College"] = "Bath Spa University",
|
||||
["Liverpool Institute of Higher Education"] = "Liverpool Hope University",
|
||||
["Liverpool Hope University College"] = "Liverpool Hope University",
|
||||
["University of Wales, Newport"] = "University of South Wales",
|
||||
["University of Wales Institute, Cardiff"] = "Cardiff Metropolitan University",
|
||||
["UWIC"] = "Cardiff Metropolitan University",
|
||||
["North East Wales Institute"] = "Wrexham University",
|
||||
["NEWI"] = "Wrexham University",
|
||||
["Glyndwr University"] = "Wrexham University",
|
||||
["Wrexham Glyndwr University"] = "Wrexham University",
|
||||
|
||||
// Other common variations
|
||||
["Open University"] = "The Open University",
|
||||
["OU"] = "The Open University",
|
||||
|
||||
@@ -11,4 +11,9 @@ public interface ICVCheckService
|
||||
Task<List<CVCheckDto>> GetUserChecksAsync(Guid userId);
|
||||
Task<VeracityReport?> GetReportAsync(Guid checkId, Guid userId);
|
||||
Task<bool> DeleteCheckAsync(Guid checkId, Guid userId);
|
||||
|
||||
/// <summary>
|
||||
/// GDPR: Delete all CV checks and associated data for a user (right to erasure).
|
||||
/// </summary>
|
||||
Task<int> DeleteAllUserDataAsync(Guid userId);
|
||||
}
|
||||
|
||||
@@ -8,8 +8,22 @@ public interface ICompanyNameMatcherService
|
||||
/// Uses AI to semantically compare a company name from a CV against Companies House candidates.
|
||||
/// Returns the best match with confidence score and reasoning.
|
||||
/// </summary>
|
||||
/// <param name="cvCompanyName">The company name as written on the CV</param>
|
||||
/// <param name="candidates">List of potential matches from Companies House</param>
|
||||
/// <param name="industryHint">Optional industry context for well-known brands (e.g., "pharmacy/healthcare retail")</param>
|
||||
/// <param name="cancellationToken">Cancellation token</param>
|
||||
Task<SemanticMatchResult?> FindBestMatchAsync(
|
||||
string cvCompanyName,
|
||||
List<CompanyCandidate> candidates,
|
||||
string? industryHint = null,
|
||||
CancellationToken cancellationToken = default);
|
||||
|
||||
/// <summary>
|
||||
/// Uses AI to detect if a company name contains multiple companies and extract them.
|
||||
/// Returns null or single-item list if it's a single company (e.g., "Ernst & Young").
|
||||
/// Returns multiple items if compound (e.g., "ASDA/WALMART" -> ["ASDA", "WALMART"]).
|
||||
/// </summary>
|
||||
Task<List<string>?> ExtractCompanyNamesAsync(
|
||||
string companyName,
|
||||
CancellationToken cancellationToken = default);
|
||||
}
|
||||
|
||||
106
src/RealCV.Infrastructure/Jobs/DataRetentionJob.cs
Normal file
@@ -0,0 +1,106 @@
|
||||
using Microsoft.EntityFrameworkCore;
|
||||
using Microsoft.Extensions.Configuration;
|
||||
using Microsoft.Extensions.Logging;
|
||||
using RealCV.Application.Interfaces;
|
||||
using RealCV.Domain.Enums;
|
||||
using RealCV.Infrastructure.Data;
|
||||
|
||||
namespace RealCV.Infrastructure.Jobs;
|
||||
|
||||
/// <summary>
/// GDPR compliance job that automatically deletes finished CV checks (and any uploaded
/// file still attached to them) once they are older than the configured retention period.
/// </summary>
/// <remarks>
/// The retention period is read from the <c>DataRetention:CVCheckRetentionDays</c>
/// configuration key and defaults to 30 days when the key is absent.
/// </remarks>
public sealed class DataRetentionJob
{
    private readonly ApplicationDbContext _dbContext;
    private readonly IFileStorageService _fileStorageService;
    private readonly ILogger<DataRetentionJob> _logger;
    private readonly int _retentionDays;

    /// <summary>
    /// Creates the job and captures the configured retention period.
    /// </summary>
    /// <param name="dbContext">Database context holding the CV checks and their flags.</param>
    /// <param name="fileStorageService">Storage service used to delete leftover uploaded files.</param>
    /// <param name="configuration">Configuration source for <c>DataRetention:CVCheckRetentionDays</c>.</param>
    /// <param name="logger">Logger for progress and failures.</param>
    public DataRetentionJob(
        ApplicationDbContext dbContext,
        IFileStorageService fileStorageService,
        IConfiguration configuration,
        ILogger<DataRetentionJob> logger)
    {
        _dbContext = dbContext;
        _fileStorageService = fileStorageService;
        _logger = logger;
        _retentionDays = configuration.GetValue<int>("DataRetention:CVCheckRetentionDays", 30);
    }

    /// <summary>
    /// Deletes every completed or failed CV check that has passed the retention cutoff,
    /// together with its flags and any file that is still referenced by the check.
    /// </summary>
    /// <param name="cancellationToken">Token passed to the database query and save.</param>
    /// <returns>A task that completes when the deletions have been saved.</returns>
    /// <exception cref="Exception">
    /// Any failure outside the per-check handling is logged and rethrown to the caller.
    /// </exception>
    public async Task ExecuteAsync(CancellationToken cancellationToken = default)
    {
        _logger.LogInformation("Starting GDPR data retention job (retention: {Days} days)", _retentionDays);

        try
        {
            var cutoffDate = DateTime.UtcNow.AddDays(-_retentionDays);

            // Find old finished CV checks that should be deleted.
            // A check whose processing failed may never have received a completion
            // timestamp, so fall back to its creation time; otherwise such records
            // would be retained forever.
            var oldChecks = await _dbContext.CVChecks
                .Include(c => c.Flags)
                .Where(c => c.Status == CheckStatus.Completed || c.Status == CheckStatus.Failed)
                .Where(c => (c.CompletedAt != null && c.CompletedAt < cutoffDate)
                         || (c.CompletedAt == null && c.CreatedAt < cutoffDate))
                .ToListAsync(cancellationToken);

            if (oldChecks.Count == 0)
            {
                _logger.LogInformation("No CV checks older than {Days} days found for deletion", _retentionDays);
                return;
            }

            _logger.LogInformation("Found {Count} CV checks older than {Days} days for deletion", oldChecks.Count, _retentionDays);

            var deletedCount = 0;
            var fileDeletedCount = 0;

            foreach (var check in oldChecks)
            {
                try
                {
                    // Delete any remaining files (should already be deleted after processing, but be thorough)
                    if (!string.IsNullOrWhiteSpace(check.BlobUrl))
                    {
                        try
                        {
                            await _fileStorageService.DeleteAsync(check.BlobUrl);
                            fileDeletedCount++;
                            _logger.LogDebug("Deleted orphaned file for CV check {CheckId}", check.Id);
                        }
                        catch (Exception ex)
                        {
                            // Best effort: a storage failure must not stop the database record from being purged.
                            _logger.LogWarning(ex, "Failed to delete file for CV check {CheckId}", check.Id);
                        }
                    }

                    // Delete associated flags
                    _dbContext.CVFlags.RemoveRange(check.Flags);

                    // Delete the CV check record
                    _dbContext.CVChecks.Remove(check);
                    deletedCount++;

                    _logger.LogDebug("Marked CV check {CheckId} for deletion (created: {Created})",
                        check.Id, check.CreatedAt);
                }
                catch (Exception ex)
                {
                    // Keep going so one bad record does not block the rest of the batch.
                    _logger.LogError(ex, "Error processing CV check {CheckId} for deletion", check.Id);
                }
            }

            // All removals are committed together in a single save.
            await _dbContext.SaveChangesAsync(cancellationToken);

            _logger.LogInformation(
                "GDPR data retention job completed. Deleted {DeletedCount} CV checks and {FileCount} orphaned files",
                deletedCount, fileDeletedCount);
        }
        catch (Exception ex)
        {
            _logger.LogError(ex, "Error in GDPR data retention job");
            throw;
        }
    }
}
|
||||
@@ -92,6 +92,19 @@ public sealed class ProcessCVCheckJob
|
||||
"Parsed CV for check {CheckId}: {EmploymentCount} employment entries",
|
||||
cvCheckId, cvData.Employment.Count);
|
||||
|
||||
// Validate that the CV contains meaningful data
|
||||
// A CV with no name, no employment AND no education is likely a parsing failure
|
||||
if (cvData.Employment.Count == 0 && cvData.Education.Count == 0 &&
|
||||
(string.IsNullOrWhiteSpace(cvData.FullName) || cvData.FullName == "Unknown"))
|
||||
{
|
||||
_logger.LogWarning(
|
||||
"CV check {CheckId} parsed with no extractable data - possible scanned/image PDF or parsing failure",
|
||||
cvCheckId);
|
||||
throw new InvalidOperationException(
|
||||
"Could not extract any employment or education data from this CV. " +
|
||||
"The file may be a scanned image, password-protected, or in an unsupported format.");
|
||||
}
|
||||
|
||||
// Step 4: Save extracted data
|
||||
cvCheck.ExtractedDataJson = JsonSerializer.Serialize(cvData, JsonDefaults.CamelCaseIndented);
|
||||
cvCheck.ProcessingStage = "Verifying Employment";
|
||||
@@ -265,6 +278,12 @@ public sealed class ProcessCVCheckJob
|
||||
cvCheckId, score);
|
||||
|
||||
await _auditService.LogAsync(cvCheck.UserId, AuditActions.CVProcessed, "CVCheck", cvCheckId, $"Score: {score}");
|
||||
|
||||
// GDPR: Delete the uploaded CV file immediately after processing
|
||||
// We only need the extracted data and report, not the original file
|
||||
await DeleteCVFileAsync(cvCheck.BlobUrl, cvCheckId);
|
||||
cvCheck.BlobUrl = string.Empty; // Clear the URL as file no longer exists
|
||||
await _dbContext.SaveChangesAsync(cancellationToken);
|
||||
}
|
||||
catch (Exception ex)
|
||||
{
|
||||
@@ -273,6 +292,8 @@ public sealed class ProcessCVCheckJob
|
||||
try
|
||||
{
|
||||
cvCheck.Status = CheckStatus.Failed;
|
||||
// Store a user-friendly error message
|
||||
cvCheck.ProcessingStage = GetUserFriendlyErrorMessage(ex);
|
||||
// Use CancellationToken.None to ensure failure status is saved even if original token is cancelled
|
||||
await _dbContext.SaveChangesAsync(CancellationToken.None);
|
||||
}
|
||||
@@ -287,6 +308,29 @@ public sealed class ProcessCVCheckJob
|
||||
}
|
||||
}
|
||||
|
||||
/// <summary>
/// GDPR: removes the uploaded CV file once processing no longer needs it.
/// A failed deletion is logged as a warning and never propagated to the caller.
/// </summary>
/// <param name="blobUrl">Location of the uploaded file; blank means there is nothing to delete.</param>
/// <param name="cvCheckId">Identifier of the CV check, used for logging only.</param>
private async Task DeleteCVFileAsync(string blobUrl, Guid cvCheckId)
{
    var hasFile = !string.IsNullOrWhiteSpace(blobUrl);

    if (hasFile)
    {
        try
        {
            await _fileStorageService.DeleteAsync(blobUrl);
            _logger.LogInformation("GDPR: Deleted CV file for check {CheckId}", cvCheckId);
        }
        catch (Exception deleteError)
        {
            // Deliberately swallowed: losing the file clean-up must not fail the processing job.
            _logger.LogWarning(deleteError, "Failed to delete CV file for check {CheckId}: {BlobUrl}", cvCheckId, blobUrl);
        }
    }
    else
    {
        _logger.LogDebug("No file to delete for CV check {CheckId}", cvCheckId);
    }
}
|
||||
|
||||
private static (int Score, List<FlagResult> Flags) CalculateVeracityScore(
|
||||
List<CompanyVerificationResult> verifications,
|
||||
List<EducationVerificationResult> educationResults,
|
||||
@@ -1382,4 +1426,39 @@ public sealed class ProcessCVCheckJob
|
||||
obj.FlagType?.ToUpperInvariant() ?? "");
|
||||
}
|
||||
}
|
||||
|
||||
/// <summary>
/// Maps an exception to a message that is safe and meaningful to show to the user.
/// The exception's message text is scanned (case-insensitively) for known phrases;
/// the first matching category wins, and a generic message is used when none match.
/// </summary>
/// <param name="ex">The exception raised while processing the CV.</param>
/// <returns>A user-facing description of the failure.</returns>
private static string GetUserFriendlyErrorMessage(Exception ex)
{
    var details = ex.Message;

    bool Mentions(string fragment)
    {
        return details.Contains(fragment, StringComparison.OrdinalIgnoreCase);
    }

    // Nothing usable came out of the parser.
    if (Mentions("no extractable data") || Mentions("Could not extract any employment"))
    {
        return "No useful data could be extracted from this CV. The file may be a scanned image or in an unsupported format.";
    }

    // Upstream API throttling.
    if (Mentions("API usage limits") || Mentions("rate limit"))
    {
        return "Service temporarily unavailable. Please try again in a few minutes.";
    }

    // The document itself could not be read.
    if (Mentions("Could not extract text"))
    {
        return "Could not read the CV file. Please ensure it's a valid PDF or DOCX document.";
    }

    // Protected documents.
    if (Mentions("password") || Mentions("encrypted"))
    {
        return "This CV appears to be password-protected. Please upload an unprotected version.";
    }

    // Anything else falls back to the generic message.
    return "An error occurred while processing your CV. Please try uploading again.";
}
|
||||
}
|
||||
|
||||
@@ -33,28 +33,53 @@ public sealed class AICompanyNameMatcherService : ICompanyNameMatcherService
|
||||
Compare the company name from a CV against official Companies House records.
|
||||
|
||||
CV Company Name: "{CV_COMPANY}"
|
||||
|
||||
{INDUSTRY_CONTEXT}
|
||||
Companies House Candidates:
|
||||
{CANDIDATES}
|
||||
|
||||
Determine which candidate (if any) is the SAME company as the CV entry.
|
||||
|
||||
Rules:
|
||||
1. A match requires the companies to be the SAME organisation, not just similar names
|
||||
2. "Families First CiC" is NOT the same as "FAMILIES AGAINST CONFORMITY LTD" - different words = different companies
|
||||
3. Trading names should match their registered entity (e.g., "Tesco" matches "TESCO PLC")
|
||||
4. Subsidiaries can match if clearly the same organisation (e.g., "ASDA" could match "ASDA STORES LIMITED")
|
||||
5. Acronyms in parentheses are abbreviations of the full name (e.g., "North Halifax Partnership (NHP)" = "NORTH HALIFAX PARTNERSHIP")
|
||||
6. CiC/CIC = Community Interest Company, LLP = Limited Liability Partnership - these are legal suffixes
|
||||
7. If the CV name contains all the key words of a candidate (ignoring Ltd/Limited/CIC/etc.), it's likely a match
|
||||
8. If NO candidate is clearly the same company, return "NONE" as the best match
|
||||
Matching Guidelines:
|
||||
1. MATCH if the CV name is the same organisation as a candidate (even if registered name differs):
|
||||
- "Boots" → "BOOTS UK LIMITED" ✓ (trading name = registered company)
|
||||
- "Boots" → "THE BOOTS COMPANY PLC" ✓ (trading name = parent company)
|
||||
- "Tesco" → "TESCO PLC" ✓ (trading name = registered name)
|
||||
- "ASDA" → "ASDA STORES LIMITED" ✓ (brand = operating company)
|
||||
- "Legal & General" → "LEGAL & GENERAL GROUP PLC" ✓ (brand = holding company)
|
||||
- "Checkout.com" → "CHECKOUT.COM PAYMENTS LIMITED" ✓ (exact match)
|
||||
- "EY UK" → "ERNST & YOUNG LLP" ✓ (trading name = partnership)
|
||||
- "Royal Bank of Scotland" → "THE ROYAL BANK OF SCOTLAND PUBLIC LIMITED COMPANY" ✓
|
||||
|
||||
2. DO NOT MATCH if the candidate adds significant DIFFERENT words that indicate a different business:
|
||||
- "Boots" ≠ "BOOTS AND BEARDS" ✗ (pharmacy chain is NOT a barber/grooming business)
|
||||
- "Legal & General" ≠ "LEGAL LIMITED" ✗ (major insurer is NOT a generic "legal" company)
|
||||
- "Checkout.com" ≠ "XN CHECKOUT LIMITED" ✗ (fintech is NOT an unrelated checkout company)
|
||||
- "EY UK" ≠ "EY UK GDPR REPRESENTATIVE LIMITED" ✗ (main employer, not a subsidiary)
|
||||
|
||||
3. KEY DISTINCTION - Geographic/legal suffixes are OK, but new business words are NOT:
|
||||
- "Boots" → "BOOTS UK LIMITED" ✓ (UK is just geographic qualifier)
|
||||
- "Boots" → "BOOTS AND BEARDS" ✗ (BEARDS indicates different business)
|
||||
- "Meridian Holdings" → "MERIDIAN (THE ORIGINAL) LIMITED" ✗ ("THE ORIGINAL" suggests different business)
|
||||
- "Paramount Consulting UK" → "PARAMOUNT LIMITED" ✗ (missing "Consulting" - different type)
|
||||
- "Apex Technology Partners" → "APEX LIMITED" ✗ (missing "Technology Partners")
|
||||
|
||||
4. Legal suffixes (Ltd, Limited, PLC, LLP, CiC) should be ignored when comparing names
|
||||
|
||||
5. Adding "THE", "GROUP", "UK", or "HOLDINGS" to a name doesn't make it a different company
|
||||
|
||||
6. When the CV mentions a well-known brand, prefer the main operating/holding company over obscure matches
|
||||
|
||||
7. If INDUSTRY CONTEXT is provided, use it to reject candidates clearly in different industries
|
||||
|
||||
CRITICAL: Return the COMPLETE company number exactly as shown (e.g., "SC083026", "02366995").
|
||||
Do NOT truncate or abbreviate the company number.
|
||||
|
||||
Respond with this exact JSON structure:
|
||||
{
|
||||
"bestMatchCompanyNumber": "string (company number of best match, or 'NONE' if no valid match)",
|
||||
"bestMatchCompanyNumber": "COMPLETE company number from the list above, or 'NONE' if no valid match",
|
||||
"confidenceScore": number (0-100, where 100 = certain match, 0 = no match),
|
||||
"matchType": "string (Exact, TradingName, Subsidiary, Parent, NoMatch)",
|
||||
"reasoning": "string (brief explanation of why this is or isn't a match)"
|
||||
"matchType": "Exact|TradingName|Subsidiary|Parent|NoMatch",
|
||||
"reasoning": "brief explanation"
|
||||
}
|
||||
""";
|
||||
|
||||
@@ -69,6 +94,7 @@ public sealed class AICompanyNameMatcherService : ICompanyNameMatcherService
|
||||
public async Task<SemanticMatchResult?> FindBestMatchAsync(
|
||||
string cvCompanyName,
|
||||
List<CompanyCandidate> candidates,
|
||||
string? industryHint = null,
|
||||
CancellationToken cancellationToken = default)
|
||||
{
|
||||
if (string.IsNullOrWhiteSpace(cvCompanyName) || candidates.Count == 0)
|
||||
@@ -76,16 +102,23 @@ public sealed class AICompanyNameMatcherService : ICompanyNameMatcherService
|
||||
return null;
|
||||
}
|
||||
|
||||
_logger.LogDebug("Using AI to match '{CVCompany}' against {Count} candidates",
|
||||
cvCompanyName, candidates.Count);
|
||||
_logger.LogDebug("Using AI to match '{CVCompany}' against {Count} candidates (industry: {Industry})",
|
||||
cvCompanyName, candidates.Count, industryHint ?? "unknown");
|
||||
|
||||
try
|
||||
{
|
||||
// Format candidates with company number prominently displayed to prevent truncation
|
||||
var candidatesText = string.Join("\n", candidates.Select((c, i) =>
|
||||
$"{i + 1}. {c.CompanyName} (Number: {c.CompanyNumber}, Status: {c.CompanyStatus ?? "Unknown"})"));
|
||||
$"[{c.CompanyNumber}] {c.CompanyName} (Status: {c.CompanyStatus ?? "Unknown"})"));
|
||||
|
||||
// Add industry context if available
|
||||
var industryContext = string.IsNullOrEmpty(industryHint)
|
||||
? ""
|
||||
: $"Industry Context: This is a well-known brand in {industryHint}. Reject candidates clearly in different industries.\n";
|
||||
|
||||
var prompt = MatchingPrompt
|
||||
.Replace("{CV_COMPANY}", cvCompanyName)
|
||||
.Replace("{INDUSTRY_CONTEXT}", industryContext)
|
||||
.Replace("{CANDIDATES}", candidatesText);
|
||||
|
||||
var messages = new List<Message>
|
||||
@@ -95,8 +128,8 @@ public sealed class AICompanyNameMatcherService : ICompanyNameMatcherService
|
||||
|
||||
var parameters = new MessageParameters
|
||||
{
|
||||
Model = "claude-sonnet-4-20250514",
|
||||
MaxTokens = 1024,
|
||||
Model = "claude-3-5-haiku-20241022",
|
||||
MaxTokens = 512,
|
||||
Messages = messages,
|
||||
System = [new SystemMessage(SystemPrompt)]
|
||||
};
|
||||
@@ -127,7 +160,8 @@ public sealed class AICompanyNameMatcherService : ICompanyNameMatcherService
|
||||
aiResponse.BestMatchCompanyNumber, aiResponse.ConfidenceScore, aiResponse.Reasoning);
|
||||
|
||||
// Find the matched candidate
|
||||
if (aiResponse.BestMatchCompanyNumber == "NONE" || aiResponse.ConfidenceScore < 50)
|
||||
// Lower threshold to 30 - we have fuzzy validation as backup
|
||||
if (aiResponse.BestMatchCompanyNumber == "NONE" || aiResponse.ConfidenceScore < 30)
|
||||
{
|
||||
return new SemanticMatchResult
|
||||
{
|
||||
@@ -142,10 +176,40 @@ public sealed class AICompanyNameMatcherService : ICompanyNameMatcherService
|
||||
var matchedCandidate = candidates.FirstOrDefault(c =>
|
||||
c.CompanyNumber.Equals(aiResponse.BestMatchCompanyNumber, StringComparison.OrdinalIgnoreCase));
|
||||
|
||||
// If exact match not found, try to find a candidate that starts with the returned number
|
||||
// This handles cases where AI truncates "09052626" to "09" or similar
|
||||
if (matchedCandidate is null && !string.IsNullOrWhiteSpace(aiResponse.BestMatchCompanyNumber)
|
||||
&& aiResponse.BestMatchCompanyNumber != "NONE")
|
||||
{
|
||||
var partialMatch = candidates.FirstOrDefault(c =>
|
||||
c.CompanyNumber.StartsWith(aiResponse.BestMatchCompanyNumber, StringComparison.OrdinalIgnoreCase));
|
||||
|
||||
if (partialMatch is not null)
|
||||
{
|
||||
_logger.LogDebug("AI returned partial company number '{Partial}', matched to full number '{Full}'",
|
||||
aiResponse.BestMatchCompanyNumber, partialMatch.CompanyNumber);
|
||||
matchedCandidate = partialMatch;
|
||||
}
|
||||
else
|
||||
{
|
||||
// Try reverse - maybe AI returned a longer string that contains the actual number
|
||||
var reverseMatch = candidates.FirstOrDefault(c =>
|
||||
aiResponse.BestMatchCompanyNumber.Contains(c.CompanyNumber, StringComparison.OrdinalIgnoreCase));
|
||||
|
||||
if (reverseMatch is not null)
|
||||
{
|
||||
_logger.LogDebug("AI returned string containing company number '{Number}'",
|
||||
reverseMatch.CompanyNumber);
|
||||
matchedCandidate = reverseMatch;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
if (matchedCandidate is null)
|
||||
{
|
||||
_logger.LogWarning("AI returned company number {Number} not in candidates list",
|
||||
aiResponse.BestMatchCompanyNumber);
|
||||
_logger.LogWarning("AI returned company number '{Number}' not in candidates list. Candidates: {Candidates}",
|
||||
aiResponse.BestMatchCompanyNumber,
|
||||
string.Join(", ", candidates.Select(c => c.CompanyNumber)));
|
||||
return null;
|
||||
}
|
||||
|
||||
@@ -164,4 +228,360 @@ public sealed class AICompanyNameMatcherService : ICompanyNameMatcherService
|
||||
return null; // Fall back to fuzzy matching
|
||||
}
|
||||
}
|
||||
|
||||
/// <summary>
/// Names of organisations (and common department phrases) that must be treated as ONE
/// employer even though they contain "&amp;", "and" or similar joining words.
/// Lookups are case-insensitive. Entries in this set are never split into parts.
/// </summary>
private static readonly HashSet<string> KnownSingleCompanyNames = new HashSet<string>(StringComparer.OrdinalIgnoreCase)
{
    // Big 4 / Professional Services
    "Ernst & Young",
    "Ernst and Young",
    "EY",
    "Deloitte and Touche",
    "Deloitte & Touche",
    "PricewaterhouseCoopers",
    "Price Waterhouse",
    "KPMG",
    "Accenture",

    // Retail
    "Marks & Spencer",
    "Marks and Spencer",
    "M&S",
    "Fortnum & Mason",
    "Fortnum and Mason",
    "Crabtree & Evelyn",
    "Holland & Barrett",
    "Holland and Barrett",
    "Past Times & Present",
    "Barnes & Noble",
    "Abercrombie & Fitch",
    "Dolce & Gabbana",
    "Bang & Olufsen",
    "Crate & Barrel",
    "Bed Bath & Beyond",
    "Bath & Body Works",

    // Consumer Goods
    "Procter & Gamble",
    "Procter and Gamble",
    "P&G",
    "Johnson & Johnson",
    "Johnson and Johnson",
    "J&J",
    "Reckitt & Colman",
    "Reckitt and Colman",
    "Colgate-Palmolive",
    "Unilever",
    "Henkel",

    // Food & Beverage
    // ("Fortnum and Mason" is already listed under Retail; a set stores it once.)
    "Prêt A Manger",
    "Pret A Manger",
    "Lyle & Scott",
    "Ben & Jerry's",
    "Ben and Jerry's",
    "Baskin & Robbins",
    "Haribo",

    // Finance & Insurance
    "Standard & Poor's",
    "Standard and Poor's",
    "S&P",
    "Moody's",
    "Fitch Ratings",
    "Lloyd's of London",
    "Coutts & Co",
    "Coutts and Co",
    "Brown Shipley & Co",
    "Schroders",

    // Law Firms (common patterns)
    "Allen & Overy",
    "Allen and Overy",
    "Clifford Chance",
    "Freshfields Bruckhaus Deringer",
    "Linklaters",
    "Slaughter and May",
    "Slaughter & May",
    "Herbert Smith Freehills",
    "Hogan Lovells",
    "Norton Rose Fulbright",
    "DLA Piper",
    "Baker & McKenzie",
    "Baker McKenzie",
    "Eversheds Sutherland",
    "Ashurst",
    "CMS",
    "Simmons & Simmons",
    "Travers Smith",
    "Macfarlanes",
    "Addleshaw Goddard",
    "Pinsent Masons",
    "Shoosmiths",
    "Irwin Mitchell",
    "DAC Beachcroft",
    "Weightmans",
    "Browne Jacobson",
    "Mills & Reeve",
    "Mills and Reeve",
    "Taylor Wessing",
    "Osborne Clarke",
    "Bird & Bird",
    "Bird and Bird",
    "Withers",
    "Charles Russell Speechlys",
    "Stephenson Harwood",
    "Watson Farley & Williams",
    "Clyde & Co",
    "Clyde and Co",
    "Reed Smith",
    "Kennedys",
    "Fieldfisher",
    "RPC",
    "Womble Bond Dickinson",
    "Burges Salmon",
    "Trowers & Hamlins",
    "Trowers and Hamlins",
    "Bevan Brittan",
    "Veale Wasbrough Vizards",

    // Media & Entertainment
    "Simon & Schuster",
    "Warner Bros",
    "Warner Brothers",
    "William Morris Endeavor",
    "Creative Artists Agency",

    // Automotive
    "Rolls-Royce",
    "Aston Martin",
    "Jaguar Land Rover",

    // Pharmaceuticals
    "GlaxoSmithKline",
    "GSK",
    "AstraZeneca",
    "Smith & Nephew",
    "Roche",

    // Engineering & Construction
    "Mott MacDonald",
    "Arup",
    "Laing O'Rourke",
    "Kier",
    "Balfour Beatty",
    "Taylor Wimpey",
    "Persimmon",
    "Bellway",
    "Berkeley",

    // Technology
    "Hewlett-Packard",
    "HP",
    "Texas Instruments",
    "AT&T",
    "T-Mobile",

    // Other
    "Young & Co",
    "Young and Co",
    "Smith & Williamson",
    "Grant Thornton",
    "BDO",
    "RSM",
    "Mazars",
    "Moore Kingston Smith",
    "Crowe",
    "PKF",
    "Saffery Champness",
    "Buzzacott",
    "HW Fisher",
    "Haysmacintyre",
    "Menzies",
    "MHA",
    "Azets",
    "Dains",
    "Streets",
    "Armstrong Watson",

    // Common department/division patterns (not to be split)
    "Sales and Marketing",
    "Research and Development",
    "R&D",
    "Human Resources",
    "Finance and Operations",
    "Legal and Compliance",
    "IT and Digital",
    "Supply Chain and Logistics",
};
|
||||
|
||||
/// <summary>
/// Lower-case fragments which, when found inside a name, suggest the "and" joins
/// divisions or regions of ONE company rather than two separate employers.
/// Each fragment carries its surrounding spaces.
/// </summary>
private static readonly string[] SingleCompanyPatterns = new string[]
{
    // e.g. "Tesco Stores and Distribution"
    " stores and ",
    // e.g. "Next Retail and Online"
    " retail and ",
    // e.g. "BMW UK and Ireland"
    " uk and ",
    // e.g. "Google Europe and Middle East"
    " europe and ",
    " division and ",
    " department and ",
    " services and ",
    " group and ",
    " plc and ",
    " ltd and ",
    " limited and ",
};
|
||||
|
||||
/// <summary>
/// Decides whether a company name actually names several companies and, if so, returns the parts.
/// The decision is rule-based (no AI call), so the work completes synchronously.
/// </summary>
/// <param name="companyName">The company name to inspect.</param>
/// <param name="cancellationToken">Accepted for interface compatibility; not used by the rule-based check.</param>
/// <returns>
/// A completed task holding the list of parts for a compound name, or null when the
/// input is blank or is judged to be a single company.
/// </returns>
public Task<List<string>?> ExtractCompanyNamesAsync(
    string companyName,
    CancellationToken cancellationToken = default)
{
    List<string>? parts = null;

    if (!string.IsNullOrWhiteSpace(companyName))
    {
        _logger.LogDebug("Checking if '{CompanyName}' is a compound name (rule-based)", companyName);

        parts = DetectCompoundName(companyName);

        if (parts is null)
        {
            _logger.LogDebug("'{CompanyName}' is a single company", companyName);
        }
        else
        {
            _logger.LogDebug("'{CompanyName}' detected as compound, parts: [{Parts}]",
                companyName, string.Join(", ", parts));
        }
    }

    return Task.FromResult(parts);
}
|
||||
|
||||
/// <summary>
/// Rule-based detection of compound company names.
/// </summary>
/// <param name="name">The raw company name; surrounding whitespace is ignored.</param>
/// <returns>
/// Null when the name is treated as a single company, otherwise the list of company
/// names it was split into (two or more entries).
/// </returns>
private List<string>? DetectCompoundName(string name)
{
    var trimmedName = name.Trim();

    // Check 1: known single companies are never split.
    // Check 2: neither are names that read like departments/divisions of one company.
    if (IsKnownSingleCompany(trimmedName) || MatchesSingleCompanyPattern(trimmedName))
    {
        return null;
    }

    // Check 3: "/" is a strong indicator of multiple companies
    if (trimmedName.Contains('/'))
    {
        var slashParts = trimmedName
            .Split('/')
            .Select(p => p.Trim())
            .Where(p => p.Length >= 2) // drop empty or one-character fragments
            .ToList();

        if (slashParts.Count >= 2)
        {
            return slashParts;
        }
    }

    // Check 4: " & " or " and " between what look like separate company names.
    // The lazy first group splits on the FIRST conjunction in the name.
    var andMatch = System.Text.RegularExpressions.Regex.Match(
        trimmedName,
        @"^(.+?)\s+(?:&|and)\s+(.+)$",
        System.Text.RegularExpressions.RegexOptions.IgnoreCase);

    if (!andMatch.Success)
    {
        // Default: treat as single company
        return null;
    }

    var part1 = andMatch.Groups[1].Value.Trim();
    var part2 = andMatch.Groups[2].Value.Trim();

    // (The known-single-company case needs no re-check here: it already returned above.)

    // If either part is very short (like initials), probably not a split
    if (part1.Length < 3 || part2.Length < 3)
    {
        return null;
    }

    // If part2 looks like a department/role descriptor, don't split
    if (IsDepartmentOrRole(part2))
    {
        return null;
    }

    // Only split when both halves look like independent company names
    if (LooksLikeCompanyName(part1) && LooksLikeCompanyName(part2))
    {
        return [part1, part2];
    }

    // Default: treat as single company
    return null;
}
|
||||
|
||||
/// <summary>
/// Determines whether a name is, or contains, one of the known single-company names.
/// </summary>
/// <remarks>
/// A contained name only counts when it appears as a whole word or phrase. Plain
/// substring matching would let short entries such as "EY" or "HP" match inside
/// unrelated words ("Disney", "Shepherd") and wrongly block a split.
/// </remarks>
/// <param name="name">The company name to test.</param>
/// <returns>True when the name should be treated as a single company.</returns>
private static bool IsKnownSingleCompany(string name)
{
    // Direct match (the set is case-insensitive)
    if (KnownSingleCompanyNames.Contains(name))
    {
        return true;
    }

    // Otherwise look for any known name embedded as a whole word/phrase
    foreach (var known in KnownSingleCompanyNames)
    {
        if (ContainsWholePhrase(name, known))
        {
            return true;
        }
    }

    return false;

    // True when phrase occurs in text with no letter or digit directly before or after it.
    static bool ContainsWholePhrase(string text, string phrase)
    {
        if (phrase.Length == 0)
        {
            return false;
        }

        var searchFrom = 0;
        while (searchFrom <= text.Length - phrase.Length)
        {
            var index = text.IndexOf(phrase, searchFrom, StringComparison.OrdinalIgnoreCase);
            if (index < 0)
            {
                return false;
            }

            var end = index + phrase.Length;
            var startsOnBoundary = index == 0 || !char.IsLetterOrDigit(text[index - 1]);
            var endsOnBoundary = end == text.Length || !char.IsLetterOrDigit(text[end]);

            if (startsOnBoundary && endsOnBoundary)
            {
                return true;
            }

            // Keep scanning: a later occurrence may sit on word boundaries.
            searchFrom = index + 1;
        }

        return false;
    }
}
|
||||
|
||||
/// <summary>
/// Checks whether the name contains any of the fragments in <c>SingleCompanyPatterns</c>.
/// The name is lower-cased first because the fragments are stored in lower case.
/// </summary>
/// <param name="name">The company name to test.</param>
/// <returns>True when at least one fragment occurs in the name.</returns>
private static bool MatchesSingleCompanyPattern(string name)
{
    var candidate = name.ToLowerInvariant();

    foreach (var fragment in SingleCompanyPatterns)
    {
        if (candidate.Contains(fragment))
        {
            return true;
        }
    }

    return false;
}
|
||||
|
||||
/// <summary>
/// Determines whether the text reads like a department, division or function
/// (e.g. "Marketing", "IT Services") rather than a separate company name.
/// </summary>
/// <remarks>
/// Keywords must appear as whole words or phrases. Substring matching would let
/// short keywords such as "it", "hr", "unit" or "team" match inside ordinary names
/// ("Smith", "Christie", "United", "Steam") and wrongly suppress a split.
/// Matching is case-insensitive.
/// </remarks>
/// <param name="text">The text that follows the "&amp;"/"and" in a company name.</param>
/// <returns>True when a department keyword occurs as a whole word or phrase.</returns>
private static bool IsDepartmentOrRole(string text)
{
    string[] departmentKeywords =
    [
        "department", "division", "team", "group", "unit",
        "services", "solutions", "operations", "logistics",
        "distribution", "manufacturing", "production",
        "marketing", "sales", "finance", "accounting",
        "hr", "human resources", "it", "technology",
        "research", "development", "r&d", "engineering",
        "retail", "wholesale", "stores", "online",
        "consulting", "advisory", "support"
    ];

    return departmentKeywords.Any(kw => ContainsWholeWord(text, kw));

    // True when keyword occurs in source with no letter or digit directly before or after it.
    static bool ContainsWholeWord(string source, string keyword)
    {
        var searchFrom = 0;
        while (searchFrom <= source.Length - keyword.Length)
        {
            var index = source.IndexOf(keyword, searchFrom, StringComparison.OrdinalIgnoreCase);
            if (index < 0)
            {
                return false;
            }

            var end = index + keyword.Length;
            var startsOnBoundary = index == 0 || !char.IsLetterOrDigit(source[index - 1]);
            var endsOnBoundary = end == source.Length || !char.IsLetterOrDigit(source[end]);

            if (startsOnBoundary && endsOnBoundary)
            {
                return true;
            }

            // Keep scanning: a later occurrence may sit on word boundaries.
            searchFrom = index + 1;
        }

        return false;
    }
}
|
||||
|
||||
/// <summary>
/// Heuristic check that a fragment could stand on its own as a company name.
/// </summary>
/// <remarks>
/// A fragment qualifies when it is at least two characters long and either
/// carries a recognised company suffix (Ltd, PLC, Group, ...) or starts with an
/// upper-case letter and is at least three characters long.
/// Suffix checks use explicit ordinal, case-insensitive comparison so the result
/// does not depend on the current culture.
/// </remarks>
/// <param name="text">The fragment to test.</param>
/// <returns>True when the fragment looks like a company name.</returns>
private static bool LooksLikeCompanyName(string text)
{
    if (text.Length < 2)
    {
        return false;
    }

    // If it contains company suffixes, definitely a company name
    string[] companySuffixes = ["ltd", "limited", "plc", "inc", "corp", "llp", "llc", "group", "holdings"];

    var hasCompanySuffix = companySuffixes.Any(s =>
        text.EndsWith(s, StringComparison.OrdinalIgnoreCase) ||
        text.Contains($" {s}", StringComparison.OrdinalIgnoreCase));

    if (hasCompanySuffix)
    {
        return true;
    }

    // Otherwise accept anything that starts with a capital and has a reasonable length
    return char.IsUpper(text[0]) && text.Length >= 3;
}
|
||||
}
|
||||
|
||||
@@ -185,17 +185,78 @@ public sealed class CVCheckService : ICVCheckService
|
||||
|
||||
var fileName = cvCheck.OriginalFileName;
|
||||
|
||||
// GDPR: Delete the uploaded file if it still exists
|
||||
if (!string.IsNullOrWhiteSpace(cvCheck.BlobUrl))
|
||||
{
|
||||
try
|
||||
{
|
||||
await _fileStorageService.DeleteAsync(cvCheck.BlobUrl);
|
||||
_logger.LogDebug("Deleted file for CV check {CheckId}", checkId);
|
||||
}
|
||||
catch (Exception ex)
|
||||
{
|
||||
_logger.LogWarning(ex, "Failed to delete file for CV check {CheckId}", checkId);
|
||||
// Continue with deletion even if file deletion fails
|
||||
}
|
||||
}
|
||||
|
||||
_dbContext.CVFlags.RemoveRange(cvCheck.Flags);
|
||||
_dbContext.CVChecks.Remove(cvCheck);
|
||||
await _dbContext.SaveChangesAsync();
|
||||
|
||||
_logger.LogInformation("Deleted CV check {CheckId} for user {UserId}", checkId, userId);
|
||||
_logger.LogInformation("GDPR: Deleted CV check {CheckId} and associated data for user {UserId}", checkId, userId);
|
||||
|
||||
await _auditService.LogAsync(userId, AuditActions.CVDeleted, "CVCheck", checkId, $"File: {fileName}");
|
||||
|
||||
return true;
|
||||
}
|
||||
|
||||
/// <summary>
/// GDPR: removes every CV check belonging to a user, including the checks' flags
/// and any uploaded file still referenced by a check.
/// </summary>
/// <param name="userId">The user whose CV data should be erased.</param>
/// <returns>The number of CV checks that were deleted (0 when the user has none).</returns>
public async Task<int> DeleteAllUserDataAsync(Guid userId)
{
    _logger.LogInformation("GDPR: Deleting all CV data for user {UserId}", userId);

    var checksToRemove = await _dbContext.CVChecks
        .Include(c => c.Flags)
        .Where(c => c.UserId == userId)
        .ToListAsync();

    if (checksToRemove.Count == 0)
    {
        _logger.LogDebug("No CV checks found for user {UserId}", userId);
        return 0;
    }

    foreach (var cvCheck in checksToRemove)
    {
        var hasStoredFile = !string.IsNullOrWhiteSpace(cvCheck.BlobUrl);
        if (hasStoredFile)
        {
            try
            {
                await _fileStorageService.DeleteAsync(cvCheck.BlobUrl);
            }
            catch (Exception fileError)
            {
                // Best effort: the database records are still removed when the file cannot be deleted.
                _logger.LogWarning(fileError, "Failed to delete file for CV check {CheckId}", cvCheck.Id);
            }
        }

        _dbContext.CVFlags.RemoveRange(cvCheck.Flags);
        _dbContext.CVChecks.Remove(cvCheck);
    }

    // Every loaded check was marked for removal, so the total equals the list size.
    var deletedCount = checksToRemove.Count;

    await _dbContext.SaveChangesAsync();

    _logger.LogInformation("GDPR: Deleted {Count} CV checks for user {UserId}", deletedCount, userId);

    await _auditService.LogAsync(userId, AuditActions.CVDeleted, null, null, $"Deleted all data: {deletedCount} checks");

    return deletedCount;
}
|
||||
|
||||
private static CVCheckDto MapToDto(CVCheck cvCheck)
|
||||
{
|
||||
return new CVCheckDto
|
||||
|
||||
@@ -171,8 +171,8 @@ public sealed class CVParserService : ICVParserService
|
||||
|
||||
var parameters = new MessageParameters
|
||||
{
|
||||
Model = "claude-sonnet-4-20250514",
|
||||
MaxTokens = 4096,
|
||||
Model = "claude-3-5-haiku-20241022",
|
||||
MaxTokens = 2048,
|
||||
Messages = messages,
|
||||
System = [new SystemMessage(SystemPrompt)]
|
||||
};
|
||||
|
||||
@@ -120,6 +120,15 @@ public sealed class TimelineAnalyserService : ITimelineAnalyserService
|
||||
var earlier = sortedEmployment[i];
|
||||
var later = sortedEmployment[j];
|
||||
|
||||
// Skip overlaps at the same company (internal promotions/transfers)
|
||||
if (IsSameCompany(earlier.CompanyName, later.CompanyName))
|
||||
{
|
||||
_logger.LogDebug(
|
||||
"Ignoring overlap at same company: {Company1} -> {Company2}",
|
||||
earlier.CompanyName, later.CompanyName);
|
||||
continue;
|
||||
}
|
||||
|
||||
var overlap = CalculateOverlap(earlier, later);
|
||||
|
||||
if (overlap is not null && overlap.Value.Months > AllowedOverlapMonths)
|
||||
@@ -143,6 +152,59 @@ public sealed class TimelineAnalyserService : ITimelineAnalyserService
|
||||
return overlaps;
|
||||
}
|
||||
|
||||
/// <summary>
/// Determines if two company names refer to the same company.
/// Handles variations like "BMW" vs "BMW UK" vs "BMW Group".
/// </summary>
/// <remarks>
/// After normalisation the names match when they are equal (ignoring case) or when
/// one is a leading whole-word prefix of the other. The prefix must end on a word
/// boundary, so "Arm" is not treated as the same company as "Armstrong Watson".
/// </remarks>
/// <param name="company1">First company name; null or blank never matches.</param>
/// <param name="company2">Second company name; null or blank never matches.</param>
/// <returns>True when both names are judged to refer to the same company.</returns>
private static bool IsSameCompany(string? company1, string? company2)
{
    if (string.IsNullOrWhiteSpace(company1) || string.IsNullOrWhiteSpace(company2))
    {
        return false;
    }

    // Normalize names for comparison
    var name1 = NormalizeCompanyName(company1);
    var name2 = NormalizeCompanyName(company2);

    // Exact match after normalization
    if (name1.Equals(name2, StringComparison.OrdinalIgnoreCase))
    {
        return true;
    }

    // Very short names are too ambiguous for prefix matching
    if (name1.Length < 3 || name2.Length < 3)
    {
        return false;
    }

    // One name extends the other (e.g. "BMW" vs "BMW Financial Services")
    return IsWordPrefix(name1, name2) || IsWordPrefix(name2, name1);

    // True when shorter is a prefix of longer AND the next character in longer is
    // not a letter or digit, i.e. the prefix ends on a word boundary.
    static bool IsWordPrefix(string shorter, string longer)
    {
        return longer.Length > shorter.Length
            && longer.StartsWith(shorter, StringComparison.OrdinalIgnoreCase)
            && !char.IsLetterOrDigit(longer[shorter.Length]);
    }
}
|
||||
|
||||
/// <summary>
/// Reduces a company name to its core by trimming whitespace and removing
/// trailing legal-form and regional qualifiers ("Ltd", "PLC", "UK", "Group", ...).
/// </summary>
/// <remarks>
/// Qualifiers are removed repeatedly until none is left at the end of the name,
/// so the result does not depend on the order in which they appear:
/// "BMW Group UK" and "BMW UK Group" both reduce to "BMW". A qualifier is only
/// removed when preceded by a space, so a name consisting solely of a qualifier
/// (e.g. "Group") is returned unchanged.
/// </remarks>
/// <param name="name">Raw company name; must not be null.</param>
/// <returns>The trimmed name with all trailing qualifiers removed.</returns>
private static string NormalizeCompanyName(string name)
{
    // Matching below is case-insensitive, so one casing per suffix is enough.
    string[] suffixes = ["Ltd", "Ltd.", "Limited", "PLC", "Inc", "Inc.",
        "Corporation", "Corp", "Corp.", "UK", "Group", "(UK)", "& Co", "& Co."];

    var normalized = name.Trim();

    // Keep sweeping until a full pass removes nothing; every removal shortens
    // the string, so the loop always terminates.
    bool stripped;
    do
    {
        stripped = false;

        foreach (var suffix in suffixes)
        {
            if (normalized.EndsWith(" " + suffix, StringComparison.OrdinalIgnoreCase))
            {
                normalized = normalized[..^(suffix.Length + 1)].Trim();
                stripped = true;
            }
        }
    }
    while (stripped);

    return normalized;
}
|
||||
|
||||
private static (DateOnly Start, DateOnly End, int Months)? CalculateOverlap(
|
||||
EmploymentEntry earlier,
|
||||
EmploymentEntry later)
|
||||
|
||||
13
src/RealCV.Web/Components/Layout/AuthLayout.razor
Normal file
@@ -0,0 +1,13 @@
|
||||
@inherits LayoutComponentBase
|
||||
|
||||
<div class="d-flex flex-column min-vh-100">
|
||||
<main class="flex-grow-1">
|
||||
@Body
|
||||
</main>
|
||||
</div>
|
||||
|
||||
<div id="blazor-error-ui" class="alert alert-danger fixed-bottom m-3" style="display: none;">
|
||||
An unhandled error has occurred.
|
||||
<a href="" class="alert-link reload">Reload</a>
|
||||
<button type="button" class="btn-close float-end dismiss" aria-label="Close"></button>
|
||||
</div>
|
||||
@@ -78,8 +78,16 @@
|
||||
</main>
|
||||
|
||||
<footer class="text-light py-4 mt-auto" style="background-color: var(--realcv-footer-bg);">
|
||||
<div class="container text-center">
|
||||
<p class="mb-0">© @DateTime.Now.Year RealCV. All rights reserved.</p>
|
||||
<div class="container">
|
||||
<div class="row align-items-center">
|
||||
<div class="col-md-6 text-center text-md-start mb-2 mb-md-0">
|
||||
<p class="mb-0">© @DateTime.Now.Year RealCV. All rights reserved.</p>
|
||||
</div>
|
||||
<div class="col-md-6 text-center text-md-end">
|
||||
<a href="/privacy" class="text-light text-decoration-none me-3">Privacy Policy</a>
|
||||
<span class="text-muted small">GDPR Compliant</span>
|
||||
</div>
|
||||
</div>
|
||||
</div>
|
||||
</footer>
|
||||
</div>
|
||||
|
||||
@@ -1,6 +1,6 @@
|
||||
@page "/account/login"
|
||||
@using RealCV.Web.Components.Layout
|
||||
@layout MainLayout
|
||||
@layout AuthLayout
|
||||
|
||||
@using Microsoft.AspNetCore.Identity
|
||||
@using RealCV.Infrastructure.Identity
|
||||
@@ -14,9 +14,9 @@
|
||||
<!-- Left side - Form -->
|
||||
<div class="auth-form-side">
|
||||
<div class="auth-form-wrapper">
|
||||
<div class="text-center mb-4">
|
||||
<div class="text-center mb-5">
|
||||
<a href="/">
|
||||
<img src="images/RealCV_Logo_Transparent.png" alt="RealCV" class="auth-logo" />
|
||||
<img src="images/RealCV_Logo_Transparent.png" alt="RealCV" class="auth-logo" style="height: 60px;" />
|
||||
</a>
|
||||
</div>
|
||||
|
||||
@@ -123,7 +123,7 @@
|
||||
|
||||
<div class="auth-testimonial">
|
||||
<blockquote>
|
||||
"RealCV has transformed our hiring process. We catch discrepancies we would have missed before."
|
||||
"RealCV has transformed our recruitment process. We catch discrepancies we would have missed before."
|
||||
</blockquote>
|
||||
<cite>- HR Director, Tech Company</cite>
|
||||
</div>
|
||||
|
||||
@@ -1,6 +1,6 @@
|
||||
@page "/account/register"
|
||||
@using RealCV.Web.Components.Layout
|
||||
@layout MainLayout
|
||||
@layout AuthLayout
|
||||
@rendermode InteractiveServer
|
||||
|
||||
@using Microsoft.AspNetCore.Identity
|
||||
@@ -16,9 +16,9 @@
|
||||
<!-- Left side - Form -->
|
||||
<div class="auth-form-side">
|
||||
<div class="auth-form-wrapper">
|
||||
<div class="text-center mb-4">
|
||||
<div class="text-center mb-5">
|
||||
<a href="/">
|
||||
<img src="images/RealCV_Logo_Transparent.png" alt="RealCV" class="auth-logo" />
|
||||
<img src="images/RealCV_Logo_Transparent.png" alt="RealCV" class="auth-logo" style="height: 60px;" />
|
||||
</a>
|
||||
</div>
|
||||
|
||||
@@ -97,9 +97,9 @@
|
||||
|
||||
<p class="text-center text-muted small mb-4">
|
||||
By creating an account, you agree to our
|
||||
<a href="#" class="text-decoration-none">Terms of Service</a>
|
||||
<a href="/privacy" class="text-decoration-none">Terms of Service</a>
|
||||
and
|
||||
<a href="#" class="text-decoration-none">Privacy Policy</a>
|
||||
<a href="/privacy" class="text-decoration-none">Privacy Policy</a>
|
||||
</p>
|
||||
|
||||
<div class="auth-divider">
|
||||
@@ -123,9 +123,9 @@
|
||||
<path d="M9.796 1.343c-.527-1.79-3.065-1.79-3.592 0l-.094.319a.873.873 0 0 1-1.255.52l-.292-.16c-1.64-.892-3.433.902-2.54 2.541l.159.292a.873.873 0 0 1-.52 1.255l-.319.094c-1.79.527-1.79 3.065 0 3.592l.319.094a.873.873 0 0 1 .52 1.255l-.16.292c-.892 1.64.901 3.434 2.541 2.54l.292-.159a.873.873 0 0 1 1.255.52l.094.319c.527 1.79 3.065 1.79 3.592 0l.094-.319a.873.873 0 0 1 1.255-.52l.292.16c1.64.893 3.434-.902 2.54-2.541l-.159-.292a.873.873 0 0 1 .52-1.255l.319-.094c1.79-.527 1.79-3.065 0-3.592l-.319-.094a.873.873 0 0 1-.52-1.255l.16-.292c.893-1.64-.902-3.433-2.541-2.54l-.292.159a.873.873 0 0 1-1.255-.52l-.094-.319zm-2.633.283c.246-.835 1.428-.835 1.674 0l.094.319a1.873 1.873 0 0 0 2.693 1.115l.291-.16c.764-.415 1.6.42 1.184 1.185l-.159.292a1.873 1.873 0 0 0 1.116 2.692l.318.094c.835.246.835 1.428 0 1.674l-.319.094a1.873 1.873 0 0 0-1.115 2.693l.16.291c.415.764-.42 1.6-1.185 1.184l-.291-.159a1.873 1.873 0 0 0-2.693 1.116l-.094.318c-.246.835-1.428.835-1.674 0l-.094-.319a1.873 1.873 0 0 0-2.692-1.115l-.292.16c-.764.415-1.6-.42-1.184-1.185l.159-.291A1.873 1.873 0 0 0 1.945 8.93l-.319-.094c-.835-.246-.835-1.428 0-1.674l.319-.094A1.873 1.873 0 0 0 3.06 4.377l-.16-.292c-.415-.764.42-1.6 1.185-1.184l.292.159a1.873 1.873 0 0 0 2.692-1.115l.094-.319z"/>
|
||||
</svg>
|
||||
</div>
|
||||
<h2 class="auth-brand-title">Start Your Free Trial</h2>
|
||||
<h2 class="auth-brand-title">Create Your Free Account</h2>
|
||||
<p class="auth-brand-text">
|
||||
Get 3 free CV verifications to experience the power of AI-driven credential analysis.
|
||||
Get 3 free CV verifications per month. No credit card required.
|
||||
</p>
|
||||
|
||||
<div class="auth-features">
|
||||
@@ -157,7 +157,7 @@
|
||||
|
||||
<div class="auth-testimonial">
|
||||
<blockquote>
|
||||
"We reduced bad hires by 40% in the first quarter using RealCV."
|
||||
"We reduced unsuitable appointments by 40% in the first quarter using RealCV."
|
||||
</blockquote>
|
||||
<cite>- Recruitment Manager, Financial Services</cite>
|
||||
</div>
|
||||
|
||||
@@ -151,23 +151,23 @@
|
||||
{
|
||||
<div class="file-list-item">
|
||||
<div class="d-flex align-items-center">
|
||||
<div class="file-type-icon me-3 @(file.Name.EndsWith(".pdf", StringComparison.OrdinalIgnoreCase) ? "pdf" : "docx")">
|
||||
<div class="file-type-icon me-2 @(file.Name.EndsWith(".pdf", StringComparison.OrdinalIgnoreCase) ? "pdf" : "docx")">
|
||||
@if (file.Name.EndsWith(".pdf", StringComparison.OrdinalIgnoreCase))
|
||||
{
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="18" height="18" fill="currentColor" viewBox="0 0 16 16">
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="14" height="14" fill="currentColor" viewBox="0 0 16 16">
|
||||
<path d="M14 14V4.5L9.5 0H4a2 2 0 0 0-2 2v12a2 2 0 0 0 2 2h8a2 2 0 0 0 2-2zM9.5 3A1.5 1.5 0 0 0 11 4.5h2V14a1 1 0 0 1-1 1H4a1 1 0 0 1-1-1V2a1 1 0 0 1 1-1h5.5v2z"/>
|
||||
</svg>
|
||||
}
|
||||
else
|
||||
{
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="18" height="18" fill="currentColor" viewBox="0 0 16 16">
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="14" height="14" fill="currentColor" viewBox="0 0 16 16">
|
||||
<path d="M14 14V4.5L9.5 0H4a2 2 0 0 0-2 2v12a2 2 0 0 0 2 2h8a2 2 0 0 0 2-2zM9.5 3A1.5 1.5 0 0 0 11 4.5h2V14a1 1 0 0 1-1 1H4a1 1 0 0 1-1-1V2a1 1 0 0 1 1-1h5.5v2z"/>
|
||||
</svg>
|
||||
}
|
||||
</div>
|
||||
<div class="flex-grow-1">
|
||||
<p class="mb-0 fw-medium">@file.Name</p>
|
||||
<small class="text-muted">@FormatFileSize(file.Size)</small>
|
||||
<div class="flex-grow-1 min-width-0">
|
||||
<span class="file-name">@file.Name</span>
|
||||
<span class="file-size">@FormatFileSize(file.Size)</span>
|
||||
</div>
|
||||
</div>
|
||||
<button class="btn btn-sm btn-outline-danger" @onclick="() => RemoveFile(file)">
|
||||
@@ -267,39 +267,71 @@
|
||||
user-select: none;
|
||||
}
|
||||
|
||||
.file-list {
|
||||
border: 1px solid var(--realcv-gray-200);
|
||||
border-radius: 8px;
|
||||
overflow: hidden;
|
||||
}
|
||||
|
||||
.file-list-item {
|
||||
display: flex;
|
||||
align-items: center;
|
||||
justify-content: space-between;
|
||||
border: 1px solid var(--realcv-gray-200);
|
||||
border-radius: 12px;
|
||||
padding: 1rem;
|
||||
margin-bottom: 0.75rem;
|
||||
padding: 0.5rem 0.75rem;
|
||||
background: var(--realcv-bg-surface);
|
||||
transition: all 0.2s ease;
|
||||
border-bottom: 1px solid var(--realcv-gray-200);
|
||||
transition: background 0.15s ease;
|
||||
}
|
||||
|
||||
.file-list-item:last-child {
|
||||
border-bottom: none;
|
||||
}
|
||||
|
||||
.file-list-item:hover {
|
||||
border-color: var(--realcv-primary);
|
||||
box-shadow: 0 4px 12px rgba(59, 111, 212, 0.08);
|
||||
background: var(--realcv-bg-muted);
|
||||
}
|
||||
|
||||
.file-list-item:nth-child(even) {
|
||||
background: rgba(0, 0, 0, 0.015);
|
||||
}
|
||||
|
||||
.file-list-item:nth-child(even):hover {
|
||||
background: var(--realcv-bg-muted);
|
||||
}
|
||||
|
||||
.file-name {
|
||||
font-size: 0.875rem;
|
||||
font-weight: 500;
|
||||
color: var(--realcv-text-primary);
|
||||
overflow: hidden;
|
||||
text-overflow: ellipsis;
|
||||
white-space: nowrap;
|
||||
}
|
||||
|
||||
.file-size {
|
||||
font-size: 0.75rem;
|
||||
color: var(--realcv-gray-500);
|
||||
margin-left: 0.5rem;
|
||||
flex-shrink: 0;
|
||||
}
|
||||
|
||||
.file-type-icon {
|
||||
width: 40px;
|
||||
height: 40px;
|
||||
border-radius: 10px;
|
||||
width: 28px;
|
||||
height: 28px;
|
||||
border-radius: 4px;
|
||||
display: flex;
|
||||
align-items: center;
|
||||
justify-content: center;
|
||||
flex-shrink: 0;
|
||||
}
|
||||
|
||||
.file-type-icon.pdf {
|
||||
background: linear-gradient(135deg, #fde8e8 0%, #fcd9d9 100%);
|
||||
background: #fef2f2;
|
||||
color: #dc2626;
|
||||
}
|
||||
|
||||
.file-type-icon.docx {
|
||||
background: linear-gradient(135deg, #e3ecf7 0%, #d4e4f4 100%);
|
||||
background: #eff6ff;
|
||||
color: var(--realcv-primary);
|
||||
}
|
||||
|
||||
|
||||
@@ -118,10 +118,10 @@
|
||||
else
|
||||
{
|
||||
<!-- Stats Cards -->
|
||||
<div class="row mb-4 g-4">
|
||||
<div class="row mb-3 g-3">
|
||||
<div class="col-md-4">
|
||||
<div class="card border-0 shadow-sm stat-card h-100">
|
||||
<div class="card-body p-4">
|
||||
<div class="card-body p-3">
|
||||
<div class="d-flex align-items-center">
|
||||
<div class="stat-icon stat-icon-primary me-3">
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="28" height="28" fill="currentColor" viewBox="0 0 16 16">
|
||||
@@ -139,7 +139,7 @@
|
||||
</div>
|
||||
<div class="col-md-4">
|
||||
<div class="card border-0 shadow-sm stat-card h-100">
|
||||
<div class="card-body p-4">
|
||||
<div class="card-body p-3">
|
||||
<div class="d-flex align-items-center">
|
||||
<div class="stat-icon stat-icon-success me-3">
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="28" height="28" fill="currentColor" viewBox="0 0 16 16">
|
||||
@@ -157,7 +157,7 @@
|
||||
</div>
|
||||
<div class="col-md-4">
|
||||
<div class="card border-0 shadow-sm stat-card h-100">
|
||||
<div class="card-body p-4">
|
||||
<div class="card-body p-3">
|
||||
<div class="d-flex align-items-center">
|
||||
<div class="stat-icon stat-icon-warning me-3">
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="28" height="28" fill="currentColor" viewBox="0 0 16 16">
|
||||
@@ -176,7 +176,7 @@
|
||||
|
||||
<!-- Checks List -->
|
||||
<div class="card border-0 shadow-sm">
|
||||
<div class="card-header py-3 border-bottom" style="background-color: var(--realcv-bg-surface);">
|
||||
<div class="card-header py-2 px-3 border-bottom" style="background-color: var(--realcv-bg-surface);">
|
||||
<div class="d-flex justify-content-between align-items-center">
|
||||
<div class="d-flex align-items-center gap-3">
|
||||
<h5 class="mb-0 fw-bold">Recent CV Checks</h5>
|
||||
@@ -203,17 +203,17 @@
|
||||
<table class="table table-hover align-middle mb-0">
|
||||
<thead>
|
||||
<tr style="background-color: var(--realcv-bg-muted);">
|
||||
<th class="border-0 ps-3 py-3" style="width: 40px;">
|
||||
<th class="border-0 ps-3 py-2" style="width: 40px;">
|
||||
<input type="checkbox" class="form-check-input"
|
||||
checked="@IsAllSelected()"
|
||||
@onchange="ToggleSelectAll"
|
||||
title="Select all" />
|
||||
</th>
|
||||
<th class="border-0 py-3 text-uppercase small fw-semibold text-muted" style="letter-spacing: 0.05em;">Candidate</th>
|
||||
<th class="border-0 py-3 text-uppercase small fw-semibold text-muted" style="letter-spacing: 0.05em;">Uploaded</th>
|
||||
<th class="border-0 py-3 text-uppercase small fw-semibold text-muted text-center" style="letter-spacing: 0.05em;">Status</th>
|
||||
<th class="border-0 py-3 text-uppercase small fw-semibold text-muted text-center" style="letter-spacing: 0.05em;">Score</th>
|
||||
<th class="border-0 py-3 pe-4 text-uppercase small fw-semibold text-muted text-end" style="letter-spacing: 0.05em;">Actions</th>
|
||||
<th class="border-0 py-2 text-uppercase small fw-semibold text-muted" style="letter-spacing: 0.05em;">Candidate</th>
|
||||
<th class="border-0 py-2 text-uppercase small fw-semibold text-muted" style="letter-spacing: 0.05em;">Uploaded</th>
|
||||
<th class="border-0 py-2 text-uppercase small fw-semibold text-muted text-center" style="letter-spacing: 0.05em;">Status</th>
|
||||
<th class="border-0 py-2 text-uppercase small fw-semibold text-muted text-center" style="letter-spacing: 0.05em;">Score</th>
|
||||
<th class="border-0 py-2 pe-4 text-uppercase small fw-semibold text-muted text-end" style="letter-spacing: 0.05em;">Actions</th>
|
||||
</tr>
|
||||
</thead>
|
||||
<tbody>
|
||||
@@ -221,15 +221,15 @@
|
||||
{
|
||||
<tr class="@(check.Status == "Completed" ? "cursor-pointer" : "") @(_selectedIds.Contains(check.Id) ? "table-active" : "")"
|
||||
@onclick="() => ViewReport(check)">
|
||||
<td class="ps-3 py-3" @onclick:stopPropagation="true">
|
||||
<td class="ps-3 py-2" @onclick:stopPropagation="true">
|
||||
<input type="checkbox" class="form-check-input"
|
||||
checked="@_selectedIds.Contains(check.Id)"
|
||||
@onchange="() => ToggleSelection(check.Id)" />
|
||||
</td>
|
||||
<td class="py-3">
|
||||
<td class="py-2">
|
||||
<div class="d-flex align-items-center">
|
||||
<div class="file-icon-wrapper me-3">
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" fill="currentColor" class="bi bi-file-earmark-person text-primary" viewBox="0 0 16 16">
|
||||
<div class="file-icon-wrapper me-2">
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" fill="currentColor" class="bi bi-file-earmark-person text-primary" viewBox="0 0 16 16">
|
||||
<path d="M11 8a3 3 0 1 1-6 0 3 3 0 0 1 6 0z"/>
|
||||
<path d="M14 14V4.5L9.5 0H4a2 2 0 0 0-2 2v12a2 2 0 0 0 2 2h8a2 2 0 0 0 2-2zM9.5 3A1.5 1.5 0 0 0 11 4.5h2v9.255S12 12 8 12s-5 1.755-5 1.755V2a1 1 0 0 1 1-1h5.5v2z"/>
|
||||
</svg>
|
||||
@@ -240,17 +240,17 @@
|
||||
</div>
|
||||
</div>
|
||||
</td>
|
||||
<td class="py-3">
|
||||
<td class="py-2">
|
||||
<div>
|
||||
<p class="mb-0 small">@check.CreatedAt.ToString("dd MMM yyyy")</p>
|
||||
<small class="text-muted">@check.CreatedAt.ToString("HH:mm")</small>
|
||||
</div>
|
||||
</td>
|
||||
<td class="py-3 text-center">
|
||||
<td class="py-2 text-center">
|
||||
@switch (check.Status)
|
||||
{
|
||||
case "Completed":
|
||||
<span class="badge rounded-pill bg-success-subtle text-success px-3 py-2">
|
||||
<span class="badge rounded-pill bg-success-subtle text-success px-2 py-1">
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="12" height="12" fill="currentColor" class="bi bi-check-circle-fill me-1" viewBox="0 0 16 16">
|
||||
<path d="M16 8A8 8 0 1 1 0 8a8 8 0 0 1 16 0zm-3.97-3.03a.75.75 0 0 0-1.08.022L7.477 9.417 5.384 7.323a.75.75 0 0 0-1.06 1.06L6.97 11.03a.75.75 0 0 0 1.079-.02l3.992-4.99a.75.75 0 0 0-.01-1.05z"/>
|
||||
</svg>
|
||||
@@ -258,13 +258,13 @@
|
||||
</span>
|
||||
break;
|
||||
case "Processing":
|
||||
<span class="badge rounded-pill bg-primary-subtle text-primary px-3 py-2">
|
||||
<span class="badge rounded-pill bg-primary-subtle text-primary px-2 py-1">
|
||||
<span class="spinner-border spinner-border-sm me-1" role="status" style="width: 0.75rem; height: 0.75rem;"></span>
|
||||
@(check.ProcessingStage ?? "Processing")
|
||||
</span>
|
||||
break;
|
||||
case "Pending":
|
||||
<span class="badge rounded-pill bg-secondary-subtle text-secondary px-3 py-2">
|
||||
<span class="badge rounded-pill bg-secondary-subtle text-secondary px-2 py-1">
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="12" height="12" fill="currentColor" class="bi bi-clock me-1" viewBox="0 0 16 16">
|
||||
<path d="M8 3.5a.5.5 0 0 0-1 0V9a.5.5 0 0 0 .252.434l3.5 2a.5.5 0 0 0 .496-.868L8 8.71V3.5z"/>
|
||||
<path d="M8 16A8 8 0 1 0 8 0a8 8 0 0 0 0 16zm7-8A7 7 0 1 1 1 8a7 7 0 0 1 14 0z"/>
|
||||
@@ -273,7 +273,7 @@
|
||||
</span>
|
||||
break;
|
||||
case "Failed":
|
||||
<span class="badge rounded-pill bg-danger-subtle text-danger px-3 py-2">
|
||||
<span class="badge rounded-pill bg-danger-subtle text-danger px-2 py-1">
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="12" height="12" fill="currentColor" class="bi bi-x-circle-fill me-1" viewBox="0 0 16 16">
|
||||
<path d="M16 8A8 8 0 1 1 0 8a8 8 0 0 1 16 0zM5.354 4.646a.5.5 0 1 0-.708.708L7.293 8l-2.647 2.646a.5.5 0 0 0 .708.708L8 8.707l2.646 2.647a.5.5 0 0 0 .708-.708L8.707 8l2.647-2.646a.5.5 0 0 0-.708-.708L8 7.293 5.354 4.646z"/>
|
||||
</svg>
|
||||
@@ -281,11 +281,11 @@
|
||||
</span>
|
||||
break;
|
||||
default:
|
||||
<span class="badge rounded-pill bg-secondary-subtle text-secondary px-3 py-2">@check.Status</span>
|
||||
<span class="badge rounded-pill bg-secondary-subtle text-secondary px-2 py-1">@check.Status</span>
|
||||
break;
|
||||
}
|
||||
</td>
|
||||
<td class="py-3 text-center">
|
||||
<td class="py-2 text-center">
|
||||
@if (check.VeracityScore.HasValue)
|
||||
{
|
||||
<div class="score-ring-container" title="Veracity Score: @check.VeracityScore%">
|
||||
@@ -303,7 +303,7 @@
|
||||
<span class="text-muted">--</span>
|
||||
}
|
||||
</td>
|
||||
<td class="py-3 pe-4 text-end">
|
||||
<td class="py-2 pe-4 text-end">
|
||||
<div class="d-flex justify-content-end align-items-center gap-2">
|
||||
@if (check.Status == "Completed")
|
||||
{
|
||||
@@ -424,10 +424,10 @@
|
||||
}
|
||||
|
||||
.file-icon-wrapper {
|
||||
width: 44px;
|
||||
height: 44px;
|
||||
width: 36px;
|
||||
height: 36px;
|
||||
background: linear-gradient(135deg, #e8f1fa 0%, #d4e4f4 100%);
|
||||
border-radius: 10px;
|
||||
border-radius: 8px;
|
||||
display: flex;
|
||||
align-items: center;
|
||||
justify-content: center;
|
||||
@@ -435,8 +435,8 @@
|
||||
|
||||
.score-ring-container {
|
||||
position: relative;
|
||||
width: 52px;
|
||||
height: 52px;
|
||||
width: 44px;
|
||||
height: 44px;
|
||||
display: inline-flex;
|
||||
align-items: center;
|
||||
justify-content: center;
|
||||
|
||||
@@ -182,6 +182,126 @@
|
||||
</div>
|
||||
</section>
|
||||
|
||||
<!-- Why RealCV Section -->
|
||||
<section class="py-5" style="background: linear-gradient(135deg, #1e3a5f 0%, #0f172a 100%);">
|
||||
<div class="container">
|
||||
<div class="text-center mb-5">
|
||||
<h2 class="fw-bold mb-3 text-white" style="font-size: 2.25rem;">Why Choose RealCV?</h2>
|
||||
<p style="font-size: 1.125rem; color: rgba(255,255,255,0.9);">Make better recruitment decisions with verified candidate information</p>
|
||||
</div>
|
||||
|
||||
<div class="row g-4">
|
||||
<div class="col-lg-4 col-md-6">
|
||||
<div class="h-100 p-4 rounded-3" style="background: rgba(255,255,255,0.1); border: 1px solid rgba(255,255,255,0.15);">
|
||||
<div class="d-flex align-items-center mb-3">
|
||||
<div class="rounded-circle p-2 me-3" style="background: rgba(34, 197, 94, 0.2);">
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" fill="#22C55E" viewBox="0 0 16 16">
|
||||
<path d="M2.5 8a5.5 5.5 0 0 1 8.25-4.764.5.5 0 0 0 .5-.866A6.5 6.5 0 1 0 14.5 8a.5.5 0 0 0-1 0 5.5 5.5 0 1 1-11 0z"/>
|
||||
<path d="M15.354 3.354a.5.5 0 0 0-.708-.708L8 9.293 5.354 6.646a.5.5 0 1 0-.708.708l3 3a.5.5 0 0 0 .708 0l7-7z"/>
|
||||
</svg>
|
||||
</div>
|
||||
<h5 class="fw-bold text-white mb-0">Reduce Poor Appointments</h5>
|
||||
</div>
|
||||
<p class="mb-0" style="color: rgba(255,255,255,0.85);">
|
||||
Studies show 30-40% of CVs contain inaccuracies. Catch embellishments and false claims before they become costly recruitment mistakes.
|
||||
</p>
|
||||
</div>
|
||||
</div>
|
||||
|
||||
<div class="col-lg-4 col-md-6">
|
||||
<div class="h-100 p-4 rounded-3" style="background: rgba(255,255,255,0.1); border: 1px solid rgba(255,255,255,0.15);">
|
||||
<div class="d-flex align-items-center mb-3">
|
||||
<div class="rounded-circle p-2 me-3" style="background: rgba(59, 130, 246, 0.2);">
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" fill="#3B82F6" viewBox="0 0 16 16">
|
||||
<path d="M4 .5a.5.5 0 0 0-1 0V1H2a2 2 0 0 0-2 2v1h16V3a2 2 0 0 0-2-2h-1V.5a.5.5 0 0 0-1 0V1H4V.5zM16 14V5H0v9a2 2 0 0 0 2 2h12a2 2 0 0 0 2-2zM9.5 7h1a.5.5 0 0 1 .5.5v1a.5.5 0 0 1-.5.5h-1a.5.5 0 0 1-.5-.5v-1a.5.5 0 0 1 .5-.5zm3 0h1a.5.5 0 0 1 .5.5v1a.5.5 0 0 1-.5.5h-1a.5.5 0 0 1-.5-.5v-1a.5.5 0 0 1 .5-.5zM2 10.5a.5.5 0 0 1 .5-.5h1a.5.5 0 0 1 .5.5v1a.5.5 0 0 1-.5.5h-1a.5.5 0 0 1-.5-.5v-1zm3.5-.5h1a.5.5 0 0 1 .5.5v1a.5.5 0 0 1-.5.5h-1a.5.5 0 0 1-.5-.5v-1a.5.5 0 0 1 .5-.5z"/>
|
||||
</svg>
|
||||
</div>
|
||||
<h5 class="fw-bold text-white mb-0">Save Time</h5>
|
||||
</div>
|
||||
<p class="mb-0" style="color: rgba(255,255,255,0.85);">
|
||||
Get comprehensive verification reports in minutes, not days. No more manual reference checking or waiting for background check results.
|
||||
</p>
|
||||
</div>
|
||||
</div>
|
||||
|
||||
<div class="col-lg-4 col-md-6">
|
||||
<div class="h-100 p-4 rounded-3" style="background: rgba(255,255,255,0.1); border: 1px solid rgba(255,255,255,0.15);">
|
||||
<div class="d-flex align-items-center mb-3">
|
||||
<div class="rounded-circle p-2 me-3" style="background: rgba(168, 85, 247, 0.2);">
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" fill="#A855F7" viewBox="0 0 16 16">
|
||||
<path d="M8 4.754a3.246 3.246 0 1 0 0 6.492 3.246 3.246 0 0 0 0-6.492zM5.754 8a2.246 2.246 0 1 1 4.492 0 2.246 2.246 0 0 1-4.492 0z"/>
|
||||
<path d="M9.796 1.343c-.527-1.79-3.065-1.79-3.592 0l-.094.319a.873.873 0 0 1-1.255.52l-.292-.16c-1.64-.892-3.433.902-2.54 2.541l.159.292a.873.873 0 0 1-.52 1.255l-.319.094c-1.79.527-1.79 3.065 0 3.592l.319.094a.873.873 0 0 1 .52 1.255l-.16.292c-.892 1.64.901 3.434 2.541 2.54l.292-.159a.873.873 0 0 1 1.255.52l.094.319c.527 1.79 3.065 1.79 3.592 0l.094-.319a.873.873 0 0 1 1.255-.52l.292.16c1.64.893 3.434-.902 2.54-2.541l-.159-.292a.873.873 0 0 1 .52-1.255l.319-.094c1.79-.527 1.79-3.065 0-3.592l-.319-.094a.873.873 0 0 1-.52-1.255l.16-.292c.893-1.64-.902-3.433-2.541-2.54l-.292.159a.873.873 0 0 1-1.255-.52l-.094-.319zm-2.633.283c.246-.835 1.428-.835 1.674 0l.094.319a1.873 1.873 0 0 0 2.693 1.115l.291-.16c.764-.415 1.6.42 1.184 1.185l-.159.292a1.873 1.873 0 0 0 1.116 2.692l.318.094c.835.246.835 1.428 0 1.674l-.319.094a1.873 1.873 0 0 0-1.115 2.693l.16.291c.415.764-.42 1.6-1.185 1.184l-.291-.159a1.873 1.873 0 0 0-2.693 1.116l-.094.318c-.246.835-1.428.835-1.674 0l-.094-.319a1.873 1.873 0 0 0-2.692-1.115l-.292.16c-.764.415-1.6-.42-1.184-1.185l.159-.291A1.873 1.873 0 0 0 1.945 8.93l-.319-.094c-.835-.246-.835-1.428 0-1.674l.319-.094A1.873 1.873 0 0 0 3.06 4.377l-.16-.292c-.415-.764.42-1.6 1.185-1.184l.292.159a1.873 1.873 0 0 0 2.692-1.115l.094-.319z"/>
|
||||
</svg>
|
||||
</div>
|
||||
<h5 class="fw-bold text-white mb-0">Official Data Sources</h5>
|
||||
</div>
|
||||
<p class="mb-0" style="color: rgba(255,255,255,0.85);">
|
||||
Verify against Companies House records, cross-reference incorporation dates, check company status, and validate director claims.
|
||||
</p>
|
||||
</div>
|
||||
</div>
|
||||
|
||||
<div class="col-lg-4 col-md-6">
|
||||
<div class="h-100 p-4 rounded-3" style="background: rgba(255,255,255,0.1); border: 1px solid rgba(255,255,255,0.15);">
|
||||
<div class="d-flex align-items-center mb-3">
|
||||
<div class="rounded-circle p-2 me-3" style="background: rgba(249, 115, 22, 0.2);">
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" fill="#F97316" viewBox="0 0 16 16">
|
||||
<path d="M8 15A7 7 0 1 1 8 1a7 7 0 0 1 0 14zm0 1A8 8 0 1 0 8 0a8 8 0 0 0 0 16z"/>
|
||||
<path d="M8 4a.5.5 0 0 1 .5.5v3h3a.5.5 0 0 1 0 1h-3v3a.5.5 0 0 1-1 0v-3h-3a.5.5 0 0 1 0-1h3v-3A.5.5 0 0 1 8 4z"/>
|
||||
</svg>
|
||||
</div>
|
||||
<h5 class="fw-bold text-white mb-0">Detailed Reports</h5>
|
||||
</div>
|
||||
<p class="mb-0" style="color: rgba(255,255,255,0.85);">
|
||||
Get actionable insights with employment verification scores, timeline analysis, education checks, and specific flags for areas of concern.
|
||||
</p>
|
||||
</div>
|
||||
</div>
|
||||
|
||||
<div class="col-lg-4 col-md-6">
|
||||
<div class="h-100 p-4 rounded-3" style="background: rgba(255,255,255,0.1); border: 1px solid rgba(255,255,255,0.15);">
|
||||
<div class="d-flex align-items-center mb-3">
|
||||
<div class="rounded-circle p-2 me-3" style="background: rgba(236, 72, 153, 0.2);">
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" fill="#EC4899" viewBox="0 0 16 16">
|
||||
<path d="M8 1a2 2 0 0 1 2 2v4H6V3a2 2 0 0 1 2-2zm3 6V3a3 3 0 0 0-6 0v4a2 2 0 0 0-2 2v5a2 2 0 0 0 2 2h6a2 2 0 0 0 2-2V9a2 2 0 0 0-2-2z"/>
|
||||
</svg>
|
||||
</div>
|
||||
<h5 class="fw-bold text-white mb-0">GDPR Compliant</h5>
|
||||
</div>
|
||||
<p class="mb-0" style="color: rgba(255,255,255,0.85);">
|
||||
CVs are deleted immediately after processing. Data is automatically purged after 30 days. Your candidates' privacy is protected.
|
||||
</p>
|
||||
</div>
|
||||
</div>
|
||||
|
||||
<div class="col-lg-4 col-md-6">
|
||||
<div class="h-100 p-4 rounded-3" style="background: rgba(255,255,255,0.1); border: 1px solid rgba(255,255,255,0.15);">
|
||||
<div class="d-flex align-items-center mb-3">
|
||||
<div class="rounded-circle p-2 me-3" style="background: rgba(20, 184, 166, 0.2);">
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" fill="#14B8A6" viewBox="0 0 16 16">
|
||||
<path d="M0 4a2 2 0 0 1 2-2h12a2 2 0 0 1 2 2v8a2 2 0 0 1-2 2H2a2 2 0 0 1-2-2V4zm2-1a1 1 0 0 0-1 1v.217l7 4.2 7-4.2V4a1 1 0 0 0-1-1H2zm13 2.383-4.708 2.825L15 11.105V5.383zm-.034 6.876-5.64-3.471L8 9.583l-1.326-.795-5.64 3.47A1 1 0 0 0 2 13h12a1 1 0 0 0 .966-.741zM1 11.105l4.708-2.897L1 5.383v5.722z"/>
|
||||
</svg>
|
||||
</div>
|
||||
<h5 class="fw-bold text-white mb-0">UK Specialist</h5>
|
||||
</div>
|
||||
<p class="mb-0" style="color: rgba(255,255,255,0.85);">
|
||||
Purpose-built for UK recruitment with support for NHS, councils, public sector employers, charities, and Companies House registered businesses.
|
||||
</p>
|
||||
</div>
|
||||
</div>
|
||||
</div>
|
||||
|
||||
<div class="text-center mt-5">
|
||||
<a href="/pricing" class="btn btn-lg px-5 py-3" style="background: white; color: #1e3a5f; font-weight: 600;">
|
||||
View Pricing Plans
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="16" height="16" fill="currentColor" class="ms-2" viewBox="0 0 16 16">
|
||||
<path fill-rule="evenodd" d="M1 8a.5.5 0 0 1 .5-.5h11.793l-3.147-3.146a.5.5 0 0 1 .708-.708l4 4a.5.5 0 0 1 0 .708l-4 4a.5.5 0 0 1-.708-.708L13.293 8.5H1.5A.5.5 0 0 1 1 8z"/>
|
||||
</svg>
|
||||
</a>
|
||||
</div>
|
||||
</div>
|
||||
</section>
|
||||
|
||||
<!-- Trust indicators -->
|
||||
<section class="py-4" style="background-color: var(--realcv-bg-muted); border-top: 1px solid var(--realcv-gray-200);">
|
||||
<div class="container">
|
||||
|
||||
@@ -11,7 +11,7 @@
|
||||
<div class="text-center mb-5">
|
||||
<h1 class="fw-bold mb-3">Simple, Transparent Pricing</h1>
|
||||
<p class="text-muted lead mb-0" style="max-width: 600px; margin: 0 auto;">
|
||||
Choose the plan that fits your hiring needs. All plans include our core CV verification technology.
|
||||
Choose the plan that fits your recruitment needs. All plans include our core CV verification technology.
|
||||
</p>
|
||||
</div>
|
||||
|
||||
@@ -69,9 +69,7 @@
|
||||
|
||||
@if (_currentPlan == "Free")
|
||||
{
|
||||
<button class="btn btn-outline-secondary w-100 py-2" disabled>
|
||||
Current Plan
|
||||
</button>
|
||||
<span class="text-muted small d-block text-center">Your current plan</span>
|
||||
}
|
||||
else
|
||||
{
|
||||
@@ -85,7 +83,7 @@
|
||||
|
||||
<!-- Professional Plan -->
|
||||
<div class="col-lg-4 col-md-6">
|
||||
<div class="card border-0 shadow h-100 position-relative @(_currentPlan == "Professional" ? "border-primary border-2" : "")">
|
||||
<div class="card shadow-lg h-100 position-relative @(_currentPlan == "Professional" ? "border-primary border-2" : "border-primary")" style="@(_currentPlan != "Professional" ? "border-width: 2px !important;" : "")">
|
||||
@if (_currentPlan == "Professional")
|
||||
{
|
||||
<div class="card-header bg-primary text-white text-center py-2 border-0">
|
||||
@@ -209,15 +207,13 @@
|
||||
|
||||
@if (_currentPlan == "Enterprise")
|
||||
{
|
||||
<button class="btn btn-outline-secondary w-100 py-2" disabled>
|
||||
Current Plan
|
||||
</button>
|
||||
<span class="text-muted small d-block text-center">Your current plan</span>
|
||||
}
|
||||
else
|
||||
{
|
||||
<form action="/api/billing/create-checkout" method="post">
|
||||
<input type="hidden" name="plan" value="Enterprise" />
|
||||
<button type="submit" class="btn btn-dark w-100 py-2 fw-semibold" disabled="@(!_isAuthenticated)">
|
||||
<button type="submit" class="btn btn-outline-primary w-100 py-2 fw-semibold" disabled="@(!_isAuthenticated)">
|
||||
@if (_isAuthenticated)
|
||||
{
|
||||
<span>Upgrade to Enterprise</span>
|
||||
|
||||
124
src/RealCV.Web/Components/Pages/Privacy.razor
Normal file
@@ -0,0 +1,124 @@
|
||||
@page "/privacy"
|
||||
|
||||
<PageTitle>Privacy Policy - RealCV</PageTitle>
|
||||
|
||||
<div class="container py-5">
|
||||
<div class="row justify-content-center">
|
||||
<div class="col-lg-8">
|
||||
<h1 class="fw-bold mb-4">Privacy Policy</h1>
|
||||
@* NOTE(review): DateTime.Now is evaluated on every render, so this always shows the current month rather than the month the policy text last changed - consider a fixed date. *@
<p class="text-muted mb-5">Last updated: @DateTime.Now.ToString("MMMM yyyy")</p>
|
||||
|
||||
<div class="card mb-4">
|
||||
<div class="card-body p-4">
|
||||
<h2 class="h4 fw-bold mb-3">
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="24" height="24" fill="currentColor" class="text-primary me-2" viewBox="0 0 16 16">
|
||||
<path d="M8 16s6-5.686 6-10A6 6 0 0 0 2 6c0 4.314 6 10 6 10zm0-7a3 3 0 1 1 0-6 3 3 0 0 1 0 6z"/>
|
||||
</svg>
|
||||
GDPR Compliance
|
||||
</h2>
|
||||
<p>
|
||||
RealCV is committed to protecting your privacy and complying with the General Data Protection Regulation (GDPR).
|
||||
This policy explains how we collect, use, and protect personal data.
|
||||
</p>
|
||||
</div>
|
||||
</div>
|
||||
|
||||
<h3 class="h5 fw-bold mt-4 mb-3">Data We Collect</h3>
|
||||
<p>When you use RealCV, we collect:</p>
|
||||
<ul class="mb-4">
|
||||
<li><strong>Account Information:</strong> Email address and password (hashed) when you register</li>
|
||||
<li><strong>CV Data:</strong> When you upload a CV for verification, we temporarily process the document to extract employment and education information</li>
|
||||
<li><strong>Verification Results:</strong> The analysis results and veracity scores generated from CV checks</li>
|
||||
</ul>
|
||||
|
||||
<h3 class="h5 fw-bold mt-4 mb-3">How We Use Your Data</h3>
|
||||
<ul class="mb-4">
|
||||
<li>To provide CV verification services</li>
|
||||
<li>To generate veracity reports</li>
|
||||
<li>To maintain your account and subscription</li>
|
||||
<li>To improve our services</li>
|
||||
</ul>
|
||||
|
||||
<div class="alert alert-info mb-4">
|
||||
<h4 class="h6 fw-bold mb-2">
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" fill="currentColor" class="me-2" viewBox="0 0 16 16">
|
||||
<path d="M8 15A7 7 0 1 1 8 1a7 7 0 0 1 0 14zm0 1A8 8 0 1 0 8 0a8 8 0 0 0 0 16z"/>
|
||||
<path d="m8.93 6.588-2.29.287-.082.38.45.083c.294.07.352.176.288.469l-.738 3.468c-.194.897.105 1.319.808 1.319.545 0 1.178-.252 1.465-.598l.088-.416c-.2.176-.492.246-.686.246-.275 0-.375-.193-.304-.533L8.93 6.588zM9 4.5a1 1 0 1 1-2 0 1 1 0 0 1 2 0z"/>
|
||||
</svg>
|
||||
Important: CV File Handling
|
||||
</h4>
|
||||
<p class="mb-0">
|
||||
<strong>Uploaded CV files are automatically deleted immediately after processing.</strong>
|
||||
We do not retain the original CV documents. Only the extracted verification data and reports are stored temporarily.
|
||||
</p>
|
||||
</div>
|
||||
|
||||
<h3 class="h5 fw-bold mt-4 mb-3">Data Retention</h3>
|
||||
<p>
|
||||
We retain CV check data for a maximum of <strong>30 days</strong> after completion.
|
||||
After this period, all associated data is automatically and permanently deleted.
|
||||
</p>
|
||||
<p>You can also manually delete your CV check data at any time from your dashboard.</p>
|
||||
|
||||
<h3 class="h5 fw-bold mt-4 mb-3">Your Rights Under GDPR</h3>
|
||||
<p>You have the following rights regarding your personal data:</p>
|
||||
<div class="row g-3 mb-4">
|
||||
<div class="col-md-6">
|
||||
<div class="border rounded p-3 h-100">
|
||||
<strong>Right to Access</strong>
|
||||
<p class="mb-0 small text-muted">View all data we hold about you</p>
|
||||
</div>
|
||||
</div>
|
||||
<div class="col-md-6">
|
||||
<div class="border rounded p-3 h-100">
|
||||
<strong>Right to Erasure</strong>
|
||||
<p class="mb-0 small text-muted">Request deletion of your data</p>
|
||||
</div>
|
||||
</div>
|
||||
<div class="col-md-6">
|
||||
<div class="border rounded p-3 h-100">
|
||||
<strong>Right to Rectification</strong>
|
||||
<p class="mb-0 small text-muted">Correct inaccurate personal data</p>
|
||||
</div>
|
||||
</div>
|
||||
<div class="col-md-6">
|
||||
<div class="border rounded p-3 h-100">
|
||||
<strong>Right to Portability</strong>
|
||||
<p class="mb-0 small text-muted">Export your data in a standard format</p>
|
||||
</div>
|
||||
</div>
|
||||
</div>
|
||||
|
||||
<h3 class="h5 fw-bold mt-4 mb-3">Data Security</h3>
|
||||
<ul class="mb-4">
|
||||
<li>All data is encrypted in transit using TLS/HTTPS</li>
|
||||
<li>Passwords are hashed using industry-standard algorithms</li>
|
||||
<li>CV files are deleted immediately after processing</li>
|
||||
<li>Access to data is restricted to authorised personnel only</li>
|
||||
</ul>
|
||||
|
||||
<h3 class="h5 fw-bold mt-4 mb-3">Third-Party Services</h3>
|
||||
<p>We use the following third-party services:</p>
|
||||
<ul class="mb-4">
|
||||
<li><strong>Companies House API:</strong> To verify UK company information (public data)</li>
|
||||
<li><strong>Anthropic Claude:</strong> For AI-powered CV parsing (data is processed in accordance with Anthropic's privacy policy)</li>
|
||||
<li><strong>Stripe:</strong> For payment processing (we do not store payment card details)</li>
|
||||
</ul>
|
||||
|
||||
<h3 class="h5 fw-bold mt-4 mb-3">Contact Us</h3>
|
||||
<p>
|
||||
If you have any questions about this privacy policy or wish to exercise your data rights,
|
||||
please contact us through your account dashboard or by email.
|
||||
</p>
|
||||
|
||||
<div class="mt-5 pt-4 border-top">
|
||||
<a href="/" class="btn btn-outline-primary">
|
||||
<svg xmlns="http://www.w3.org/2000/svg" width="16" height="16" fill="currentColor" class="me-2" viewBox="0 0 16 16">
|
||||
<path fill-rule="evenodd" d="M15 8a.5.5 0 0 0-.5-.5H2.707l3.147-3.146a.5.5 0 1 0-.708-.708l-4 4a.5.5 0 0 0 0 .708l4 4a.5.5 0 0 0 .708-.708L2.707 8.5H14.5A.5.5 0 0 0 15 8z"/>
|
||||
</svg>
|
||||
Back to Home
|
||||
</a>
|
||||
</div>
|
||||
</div>
|
||||
</div>
|
||||
</div>
|
||||
@@ -74,7 +74,7 @@
|
||||
<path d="M7.002 12a1 1 0 1 1 2 0 1 1 0 0 1-2 0zM7.1 5.995a.905.905 0 1 1 1.8 0l-.35 3.507a.552.552 0 0 1-1.1 0L7.1 5.995z"/>
|
||||
</svg>
|
||||
<h4 class="mb-2">Processing Failed</h4>
|
||||
<p class="text-muted">We encountered an error processing your CV. Please try uploading again.</p>
|
||||
<p class="text-muted">@(!string.IsNullOrEmpty(_check.ProcessingStage) ? _check.ProcessingStage : "We encountered an error processing your CV. Please try uploading again.")</p>
|
||||
}
|
||||
|
||||
<p class="text-muted small mt-4">
|
||||
|
||||
@@ -169,12 +169,20 @@ try
|
||||
});
|
||||
}
|
||||
|
||||
// Schedule recurring job to reset monthly usage
|
||||
// Schedule recurring jobs
|
||||
var recurringJobManager = app.Services.GetRequiredService<IRecurringJobManager>();
|
||||
|
||||
// Reset monthly usage at 00:05 UTC daily
|
||||
recurringJobManager.AddOrUpdate<RealCV.Infrastructure.Jobs.ResetMonthlyUsageJob>(
|
||||
"reset-monthly-usage",
|
||||
job => job.ExecuteAsync(CancellationToken.None),
|
||||
Cron.Daily(0, 5)); // Run at 00:05 UTC daily
|
||||
Cron.Daily(0, 5));
|
||||
|
||||
// GDPR: Run data retention cleanup at 02:00 UTC daily
|
||||
recurringJobManager.AddOrUpdate<RealCV.Infrastructure.Jobs.DataRetentionJob>(
|
||||
"gdpr-data-retention",
|
||||
job => job.ExecuteAsync(CancellationToken.None),
|
||||
Cron.Daily(2, 0));
|
||||
|
||||
// Login endpoint
|
||||
app.MapPost("/account/perform-login", async (
|
||||
|
||||
@@ -43,7 +43,7 @@ public class PdfReportService : IPdfReportService
|
||||
{
|
||||
row.RelativeItem().Column(col =>
|
||||
{
|
||||
col.Item().Text("TrueCV").Bold().FontSize(24).FontColor(Colors.Blue.Darken2);
|
||||
col.Item().Text("RealCV").Bold().FontSize(24).FontColor(Colors.Blue.Darken2);
|
||||
col.Item().Text("CV Verification Report").FontSize(14).FontColor(Colors.Grey.Darken1);
|
||||
});
|
||||
row.ConstantItem(100).AlignRight().Column(col =>
|
||||
@@ -62,7 +62,7 @@ public class PdfReportService : IPdfReportService
|
||||
row.ConstantItem(120).Border(2).BorderColor(scoreColor).Padding(10).AlignCenter().Column(col =>
|
||||
{
|
||||
col.Item().AlignCenter().Text(report.OverallScore.ToString()).Bold().FontSize(28).FontColor(scoreColor);
|
||||
col.Item().AlignCenter().Text("TrueCV Score").FontSize(10).FontColor(scoreColor);
|
||||
col.Item().AlignCenter().Text("RealCV Score").FontSize(10).FontColor(scoreColor);
|
||||
});
|
||||
});
|
||||
|
||||
@@ -239,7 +239,7 @@ public class PdfReportService : IPdfReportService
|
||||
{
|
||||
row.RelativeItem().Column(col =>
|
||||
{
|
||||
col.Item().Text("TrueCV").Bold().FontSize(24).FontColor(Colors.Blue.Darken2);
|
||||
col.Item().Text("RealCV").Bold().FontSize(24).FontColor(Colors.Blue.Darken2);
|
||||
col.Item().Text("CV Verification Report Summary").FontSize(14).FontColor(Colors.Grey.Darken1);
|
||||
});
|
||||
row.ConstantItem(100).AlignRight().Text(DateTime.Now.ToString("dd MMM yyyy")).FontSize(10).FontColor(Colors.Grey.Medium);
|
||||
@@ -306,7 +306,7 @@ public class PdfReportService : IPdfReportService
|
||||
column.Item().LineHorizontal(1).LineColor(Colors.Grey.Lighten2);
|
||||
column.Item().PaddingTop(10).Row(row =>
|
||||
{
|
||||
row.RelativeItem().Text("Generated by TrueCV - CV Verification Platform").FontSize(8).FontColor(Colors.Grey.Medium);
|
||||
row.RelativeItem().Text("Generated by RealCV - CV Verification Platform").FontSize(8).FontColor(Colors.Grey.Medium);
|
||||
row.RelativeItem().AlignRight().Text(x =>
|
||||
{
|
||||
x.Span("Page ").FontSize(8).FontColor(Colors.Grey.Medium);
|
||||
|
||||
@@ -3,6 +3,9 @@
|
||||
"DefaultConnection": "Server=.;Database=RealCV;Trusted_Connection=True;TrustServerCertificate=True;",
|
||||
"HangfireConnection": "Server=.;Database=RealCV_Hangfire;Trusted_Connection=True;TrustServerCertificate=True;"
|
||||
},
|
||||
"DataRetention": {
|
||||
"CVCheckRetentionDays": 30
|
||||
},
|
||||
"CompaniesHouse": {
|
||||
"BaseUrl": "https://api.company-information.service.gov.uk",
|
||||
"ApiKey": ""
|
||||
|
||||
@@ -30,7 +30,7 @@
|
||||
--realcv-info: #0EA5E9; /* Sky Blue */
|
||||
--realcv-info-light: #E0F2FE;
|
||||
|
||||
--realcv-accent: var(--realcv-accent); /* Light Blue - accent for dark backgrounds */
|
||||
--realcv-accent: #60A5FA; /* Light Blue - accent for dark backgrounds */
|
||||
|
||||
--realcv-neutral: #64748B; /* Slate */
|
||||
--realcv-neutral-light: #F1F5F9;
|
||||
@@ -1051,8 +1051,12 @@ h1:focus {
|
||||
}
|
||||
|
||||
.auth-logo {
|
||||
height: 48px;
|
||||
margin-bottom: 1rem;
|
||||
height: 60px;
|
||||
transition: opacity var(--realcv-transition);
|
||||
}
|
||||
|
||||
.auth-logo:hover {
|
||||
opacity: 0.85;
|
||||
}
|
||||
|
||||
.auth-title {
|
||||
@@ -1116,7 +1120,7 @@ h1:focus {
|
||||
|
||||
.auth-stat-label {
|
||||
font-size: 0.875rem;
|
||||
color: rgba(255, 255, 255, 0.8);
|
||||
color: rgba(255, 255, 255, 0.9);
|
||||
margin-top: 0.25rem;
|
||||
}
|
||||
|
||||
@@ -1137,7 +1141,7 @@ h1:focus {
|
||||
|
||||
.auth-testimonial cite {
|
||||
font-size: 0.875rem;
|
||||
color: rgba(255, 255, 255, 0.8);
|
||||
color: rgba(255, 255, 255, 0.85);
|
||||
font-style: normal;
|
||||
}
|
||||
|
||||
|
||||
319
tests/RealCV.Tests/Integration/CVBatchTester.cs
Normal file
@@ -0,0 +1,319 @@
|
||||
using System.Text.Json;
|
||||
using Microsoft.EntityFrameworkCore;
|
||||
using Microsoft.Extensions.Configuration;
|
||||
using Microsoft.Extensions.DependencyInjection;
|
||||
using Microsoft.Extensions.Logging;
|
||||
using RealCV.Application.Interfaces;
|
||||
using RealCV.Application.Models;
|
||||
using RealCV.Infrastructure.Data;
|
||||
using RealCV.Infrastructure.ExternalApis;
|
||||
using RealCV.Infrastructure.Services;
|
||||
using RealCV.Infrastructure.Configuration;
|
||||
|
||||
namespace RealCV.Tests.Integration;
|
||||
|
||||
/// <summary>
|
||||
/// Test utility to batch process CVs and output verification findings.
|
||||
/// Run with: dotnet test --filter "FullyQualifiedName~CVBatchTester" -- TestRunParameters.Parameter(name=\"CvFolder\", value=\"/path/to/cvs\")
|
||||
/// Or call the ProcessFolderAsync method directly.
|
||||
/// </summary>
|
||||
public class CVBatchTester
|
||||
{
|
||||
private readonly IServiceProvider _serviceProvider;
|
||||
|
||||
/// <summary>
/// Builds the dependency-injection container that every processed CV resolves its services from.
/// </summary>
public CVBatchTester()
{
    IServiceCollection registrations = new ServiceCollection();
    ConfigureServices(registrations);

    // Built once and kept for the lifetime of this instance; ProcessSingleCVAsync
    // creates a scope from it for each CV.
    _serviceProvider = registrations.BuildServiceProvider();
}
|
||||
|
||||
/// <summary>
/// Registers everything needed to parse and verify a CV: configuration, console logging,
/// the database context factory, the Companies House client, the AI company-name matcher
/// and the verification services.
/// </summary>
/// <param name="services">Service collection that receives the registrations.</param>
/// <exception cref="InvalidOperationException">
/// Thrown when no <c>DefaultConnection</c> connection string is configured.
/// </exception>
private static void ConfigureServices(IServiceCollection services)
{
    // Sources are layered in the order they are added, so environment variables
    // override both JSON files.
    var configuration = new ConfigurationBuilder()
        .SetBasePath(Directory.GetCurrentDirectory())
        .AddJsonFile("appsettings.json", optional: true)
        .AddJsonFile("appsettings.Development.json", optional: true)
        .AddEnvironmentVariables()
        .Build();

    // Logging
    services.AddLogging(builder =>
    {
        builder.AddConsole();
        builder.SetMinimumLevel(LogLevel.Information);
    });

    // Database. The connection string must come from configuration: a hard-coded fallback
    // containing a server password would put a credential under source control.
    var connectionString = configuration.GetConnectionString("DefaultConnection");
    if (string.IsNullOrWhiteSpace(connectionString))
    {
        throw new InvalidOperationException(
            "Connection string 'DefaultConnection' is not configured. Add it to appsettings.json or " +
            "appsettings.Development.json, or set the ConnectionStrings__DefaultConnection environment variable.");
    }

    services.AddDbContextFactory<ApplicationDbContext>(options =>
        options.UseSqlServer(connectionString));

    // Companies House
    services.Configure<CompaniesHouseSettings>(configuration.GetSection("CompaniesHouse"));
    services.AddHttpClient<CompaniesHouseClient>();

    // Anthropic (for AI matching)
    services.Configure<AnthropicSettings>(configuration.GetSection("Anthropic"));
    services.AddScoped<ICompanyNameMatcherService, AICompanyNameMatcherService>();

    // Services
    services.AddScoped<ICompanyVerifierService, CompanyVerifierService>();
    services.AddScoped<IEducationVerifierService, EducationVerifierService>();
    services.AddScoped<ICVParserService, CVParserService>();
}
|
||||
|
||||
/// <summary>
/// Processes every CV (.pdf, .docx, .doc) found directly inside a folder, printing progress to
/// the console. A file that fails is recorded with its error message and does not stop the batch.
/// </summary>
/// <param name="folderPath">Folder to scan; sub-folders are not searched.</param>
/// <returns>One <see cref="CVVerificationSummary"/> per CV file, ordered by file path.</returns>
/// <exception cref="DirectoryNotFoundException">
/// Thrown when <paramref name="folderPath"/> does not exist.
/// </exception>
public async Task<List<CVVerificationSummary>> ProcessFolderAsync(string folderPath)
{
    if (!Directory.Exists(folderPath))
    {
        throw new DirectoryNotFoundException($"Folder not found: {folderPath}");
    }

    var cvExtensions = new[] { ".pdf", ".docx", ".doc" };

    // Directory.GetFiles does not guarantee any ordering, so sort explicitly to make the
    // console output and the returned list reproducible between runs.
    var cvFiles = Directory.GetFiles(folderPath, "*.*", SearchOption.TopDirectoryOnly)
        .Where(path => cvExtensions.Any(ext => path.EndsWith(ext, StringComparison.OrdinalIgnoreCase)))
        .OrderBy(path => path, StringComparer.OrdinalIgnoreCase)
        .ToList();

    Console.WriteLine($"Found {cvFiles.Count} CV files in {folderPath}");
    Console.WriteLine(new string('=', 80));

    var results = new List<CVVerificationSummary>();

    foreach (var cvFile in cvFiles)
    {
        Console.WriteLine($"\nProcessing: {Path.GetFileName(cvFile)}");
        Console.WriteLine(new string('-', 60));

        try
        {
            var result = await ProcessSingleCVAsync(cvFile);
            results.Add(result);
            PrintSummary(result);
        }
        catch (Exception ex)
        {
            // Best effort: keep going with the remaining files and surface the failure in the results.
            Console.WriteLine($"ERROR: {ex.Message}");
            results.Add(new CVVerificationSummary
            {
                FileName = Path.GetFileName(cvFile),
                Error = ex.Message
            });
        }
    }

    // Print overall summary
    Console.WriteLine("\n" + new string('=', 80));
    Console.WriteLine("OVERALL SUMMARY");
    Console.WriteLine(new string('=', 80));
    PrintOverallSummary(results);

    return results;
}
|
||||
|
||||
/// <summary>
/// Parses one CV file, verifies each employer and all education entries, and collects the
/// outcome into a summary. An employer whose verification throws is recorded as unverified
/// with the error text in its notes.
/// </summary>
/// <param name="filePath">Path of the CV file to process.</param>
/// <returns>The verification summary for the file.</returns>
private async Task<CVVerificationSummary> ProcessSingleCVAsync(string filePath)
{
    // Services are resolved from a scope that lives only for this CV.
    using var scope = _serviceProvider.CreateScope();
    var provider = scope.ServiceProvider;
    var parser = provider.GetRequiredService<ICVParserService>();
    var employerChecker = provider.GetRequiredService<ICompanyVerifierService>();
    var educationChecker = provider.GetRequiredService<IEducationVerifierService>();

    var fileName = Path.GetFileName(filePath);

    // Parse the CV
    await using var cvStream = File.OpenRead(filePath);
    var cv = await parser.ParseAsync(cvStream, fileName);

    var summary = new CVVerificationSummary
    {
        FileName = fileName,
        CandidateName = cv.FullName ?? "Unknown"
    };

    // Employers: verified one at a time so a single failure does not lose the others.
    if (cv.Employment is { Count: > 0 } jobs)
    {
        foreach (var job in jobs)
        {
            EmployerVerificationSummary outcome;
            try
            {
                var match = await employerChecker.VerifyCompanyAsync(
                    job.CompanyName,
                    job.StartDate,
                    job.EndDate,
                    job.JobTitle);

                outcome = new EmployerVerificationSummary
                {
                    ClaimedName = job.CompanyName,
                    MatchedName = match.MatchedCompanyName,
                    CompanyNumber = match.MatchedCompanyNumber,
                    IsVerified = match.IsVerified,
                    MatchScore = match.MatchScore,
                    Notes = match.VerificationNotes,
                    Status = match.CompanyStatus
                };
            }
            catch (Exception ex)
            {
                outcome = new EmployerVerificationSummary
                {
                    ClaimedName = job.CompanyName,
                    IsVerified = false,
                    Notes = $"Error: {ex.Message}"
                };
            }

            summary.EmployerResults.Add(outcome);
        }
    }

    // Education: the verifier takes the whole list in one call.
    if (cv.Education is { Count: > 0 } studies)
    {
        var claims = studies
            .Select(e => new EducationEntry
            {
                Institution = e.Institution,
                Qualification = e.Qualification,
                Subject = e.Subject,
                StartDate = e.StartDate,
                EndDate = e.EndDate
            })
            .ToList();

        foreach (var checkedEntry in educationChecker.VerifyAll(claims))
        {
            summary.EducationResults.Add(new EducationVerificationSummary
            {
                ClaimedInstitution = checkedEntry.ClaimedInstitution,
                MatchedInstitution = checkedEntry.MatchedInstitution,
                Qualification = checkedEntry.ClaimedQualification,
                IsVerified = checkedEntry.IsVerified,
                Status = checkedEntry.Status,
                Notes = checkedEntry.VerificationNotes
            });
        }
    }

    return summary;
}
|
||||
|
||||
/// <summary>
/// Writes the per-CV result to the console: the candidate name, then one entry per employer
/// and per education record with a tick or cross and either the match or the reason.
/// </summary>
/// <param name="summary">Verification result for a single CV.</param>
private static void PrintSummary(CVVerificationSummary summary)
{
    Console.WriteLine($"Candidate: {summary.CandidateName}");

    Console.WriteLine($"\n EMPLOYERS ({summary.EmployerResults.Count}):");
    foreach (var employer in summary.EmployerResults)
    {
        string marker;
        string detail;
        if (employer.IsVerified)
        {
            marker = "✓";
            detail = $"-> {employer.MatchedName} ({employer.MatchScore}%)";
        }
        else
        {
            marker = "✗";
            detail = employer.Notes ?? "Not found";
        }

        Console.WriteLine($" {marker} {employer.ClaimedName}");
        Console.WriteLine($" {detail}");
    }

    Console.WriteLine($"\n EDUCATION ({summary.EducationResults.Count}):");
    foreach (var school in summary.EducationResults)
    {
        var marker = "✗";
        if (school.IsVerified)
        {
            marker = "✓";
        }

        // Default to the notes (or status); show the match only for a verified entry that has one.
        var detail = school.Notes ?? school.Status;
        if (school.IsVerified && school.MatchedInstitution is not null)
        {
            detail = $"-> {school.MatchedInstitution}";
        }

        Console.WriteLine($" {marker} {school.ClaimedInstitution}");
        Console.WriteLine($" {school.Qualification}");
        Console.WriteLine($" {detail}");
    }
}
|
||||
|
||||
/// <summary>
/// Writes batch-wide totals to the console: how many CVs processed without error, the share of
/// verified employers and education entries, and up to 20 of the most frequent unverified
/// employer and institution names.
/// </summary>
/// <param name="results">Summaries for every CV in the batch, including failed ones.</param>
private static void PrintOverallSummary(List<CVVerificationSummary> results)
{
    // Whole-number percentage; an empty total yields 0 instead of dividing by zero.
    static int Percent(int part, int whole)
    {
        return whole > 0 ? part * 100 / whole : 0;
    }

    // Prints the heading and the 20 largest groups, or nothing when there are no groups.
    static void PrintTopGroups<T>(string heading, List<IGrouping<string, T>> groups)
    {
        if (groups.Count == 0)
        {
            return;
        }

        Console.WriteLine(heading);
        foreach (var group in groups.Take(20))
        {
            Console.WriteLine($" - {group.Key} (x{group.Count()})");
        }
    }

    var employers = results.SelectMany(r => r.EmployerResults).ToList();
    var education = results.SelectMany(r => r.EducationResults).ToList();

    var successfulCVs = results.Count(r => r.Error is null);
    var totalEmployers = employers.Count;
    var verifiedEmployers = employers.Count(e => e.IsVerified);
    var totalEducation = education.Count;
    var verifiedEducation = education.Count(e => e.IsVerified);

    Console.WriteLine($"CVs Processed: {successfulCVs}/{results.Count}");
    Console.WriteLine($"Employers: {verifiedEmployers}/{totalEmployers} verified ({Percent(verifiedEmployers, totalEmployers)}%)");
    Console.WriteLine($"Education: {verifiedEducation}/{totalEducation} verified ({Percent(verifiedEducation, totalEducation)}%)");

    // Unverified employers, most frequently claimed first
    var unverifiedEmployers = employers
        .Where(e => !e.IsVerified)
        .GroupBy(e => e.ClaimedName)
        .OrderByDescending(g => g.Count())
        .ToList();
    PrintTopGroups($"\nUNVERIFIED EMPLOYERS ({unverifiedEmployers.Count} unique):", unverifiedEmployers);

    // Unverified institutions, most frequently claimed first
    var unverifiedEducation = education
        .Where(e => !e.IsVerified)
        .GroupBy(e => e.ClaimedInstitution)
        .OrderByDescending(g => g.Count())
        .ToList();
    PrintTopGroups($"\nUNVERIFIED INSTITUTIONS ({unverifiedEducation.Count} unique):", unverifiedEducation);
}
|
||||
|
||||
/// <summary>
/// Serialises the batch results as indented JSON, writes them to a file and reports the
/// destination on the console.
/// </summary>
/// <param name="results">Summaries to export.</param>
/// <param name="outputPath">File that receives the JSON.</param>
public static void ExportToJson(List<CVVerificationSummary> results, string outputPath)
{
    var indented = new JsonSerializerOptions { WriteIndented = true };
    File.WriteAllText(outputPath, JsonSerializer.Serialize(results, indented));

    Console.WriteLine($"\nResults exported to: {outputPath}");
}
|
||||
}
|
||||
|
||||
/// <summary>
/// Verification outcome for one CV file: who the candidate is, what was found for each
/// employer and education entry, and the error if the file could not be processed.
/// </summary>
public class CVVerificationSummary
{
    /// <summary>Name of the CV file, without its directory.</summary>
    public string FileName { get; set; } = string.Empty;

    /// <summary>Candidate name taken from the parsed CV.</summary>
    public string CandidateName { get; set; } = string.Empty;

    /// <summary>Error message when processing failed; <c>null</c> otherwise.</summary>
    public string? Error { get; set; }

    /// <summary>One entry per employer listed on the CV.</summary>
    public List<EmployerVerificationSummary> EmployerResults { get; set; } = new List<EmployerVerificationSummary>();

    /// <summary>One entry per education record listed on the CV.</summary>
    public List<EducationVerificationSummary> EducationResults { get; set; } = new List<EducationVerificationSummary>();
}
|
||||
|
||||
/// <summary>
/// Result of checking a single employer claimed on a CV.
/// </summary>
public class EmployerVerificationSummary
{
    /// <summary>Company name exactly as written on the CV.</summary>
    public string ClaimedName { get; set; } = string.Empty;

    /// <summary>Name of the company the claim was matched to, if any.</summary>
    public string? MatchedName { get; set; }

    /// <summary>Registration number of the matched company, if any.</summary>
    public string? CompanyNumber { get; set; }

    /// <summary>Whether the employer was verified.</summary>
    public bool IsVerified { get; set; }

    /// <summary>Match score reported by the verifier; printed as a percentage.</summary>
    public int MatchScore { get; set; }

    /// <summary>Verifier notes, or the error text when verification threw.</summary>
    public string? Notes { get; set; }

    /// <summary>Status of the matched company as reported by the verifier.</summary>
    public string? Status { get; set; }
}
|
||||
|
||||
/// <summary>
/// Result of checking a single education entry claimed on a CV.
/// </summary>
public class EducationVerificationSummary
{
    /// <summary>Institution name as claimed.</summary>
    public string ClaimedInstitution { get; set; } = string.Empty;

    /// <summary>Institution the claim was matched to, if any.</summary>
    public string? MatchedInstitution { get; set; }

    /// <summary>Qualification as claimed.</summary>
    public string? Qualification { get; set; }

    /// <summary>Whether the entry was verified.</summary>
    public bool IsVerified { get; set; }

    /// <summary>Status reported by the education verifier.</summary>
    public string? Status { get; set; }

    /// <summary>Notes reported by the education verifier.</summary>
    public string? Notes { get; set; }
}
|
||||
@@ -76,8 +76,9 @@ public class CompanyVerifierServiceTests : IDisposable
|
||||
_mockAiMatcher.Setup(m => m.FindBestMatchAsync(
|
||||
It.IsAny<string>(),
|
||||
It.IsAny<List<CompanyCandidate>>(),
|
||||
It.IsAny<string?>(),
|
||||
It.IsAny<CancellationToken>()))
|
||||
.Returns((string cvCompanyName, List<CompanyCandidate> candidates, CancellationToken _) =>
|
||||
.Returns((string cvCompanyName, List<CompanyCandidate> candidates, string? industryHint, CancellationToken _) =>
|
||||
{
|
||||
// Find exact or close match in candidates
|
||||
var exactMatch = candidates.FirstOrDefault(c =>
|
||||
|
||||
179
tests/RealCV.Tests/Services/CompoundNameDetectionTests.cs
Normal file
@@ -0,0 +1,179 @@
|
||||
using FluentAssertions;
|
||||
using Microsoft.Extensions.Logging.Abstractions;
|
||||
using Microsoft.Extensions.Options;
|
||||
using RealCV.Infrastructure.Configuration;
|
||||
using RealCV.Infrastructure.Services;
|
||||
|
||||
namespace RealCV.Tests.Services;
|
||||
|
||||
/// <summary>
/// Exercises the rule-based detection that decides whether a company name taken from a CV
/// should be split into several company names (a non-null result) or left alone (null).
/// </summary>
public sealed class CompoundNameDetectionTests
{
    private readonly AICompanyNameMatcherService _sut;

    public CompoundNameDetectionTests()
    {
        var anthropicSettings = new AnthropicSettings { ApiKey = "test-key" };
        _sut = new AICompanyNameMatcherService(
            Options.Create(anthropicSettings),
            NullLogger<AICompanyNameMatcherService>.Instance);
    }

    #region Known Single Companies (should NOT be split)

    [Theory]
    [InlineData("Ernst & Young")]
    [InlineData("Ernst and Young")]
    [InlineData("Marks & Spencer")]
    [InlineData("Marks and Spencer")]
    [InlineData("Procter & Gamble")]
    [InlineData("Johnson & Johnson")]
    [InlineData("Deloitte and Touche")]
    [InlineData("Allen & Overy")]
    [InlineData("Slaughter and May")]
    [InlineData("Holland & Barrett")]
    [InlineData("Smith & Nephew")]
    [InlineData("AT&T")]
    [InlineData("M&S")]
    public async Task ExtractCompanyNamesAsync_KnownSingleCompany_ReturnsNull(string companyName)
    {
        var extracted = await _sut.ExtractCompanyNamesAsync(companyName);

        extracted.Should().BeNull($"'{companyName}' is a known single company and should not be split");
    }

    [Theory]
    [InlineData("Ernst & Young LLP")]
    [InlineData("Marks & Spencer PLC")]
    [InlineData("Procter & Gamble UK")]
    [InlineData("Johnson & Johnson Medical")]
    public async Task ExtractCompanyNamesAsync_KnownSingleCompanyWithSuffix_ReturnsNull(string companyName)
    {
        var extracted = await _sut.ExtractCompanyNamesAsync(companyName);

        extracted.Should().BeNull($"'{companyName}' contains a known single company and should not be split");
    }

    #endregion

    #region Department/Division Patterns (should NOT be split)

    [Theory]
    [InlineData("Tesco Stores and Distribution")]
    [InlineData("BMW UK and Ireland")]
    [InlineData("Google Europe and Middle East")]
    [InlineData("Sales and Marketing")]
    [InlineData("Research and Development")]
    [InlineData("Finance and Operations")]
    public async Task ExtractCompanyNamesAsync_DepartmentPattern_ReturnsNull(string companyName)
    {
        var extracted = await _sut.ExtractCompanyNamesAsync(companyName);

        extracted.Should().BeNull($"'{companyName}' looks like departments/divisions and should not be split");
    }

    #endregion

    #region Compound Names with Slash (SHOULD be split)

    [Theory]
    [InlineData("ASDA/WALMART", new[] { "ASDA", "WALMART" })]
    [InlineData("BBC/ITV", new[] { "BBC", "ITV" })]
    [InlineData("Tesco/Sainsbury's", new[] { "Tesco", "Sainsbury's" })]
    [InlineData("Microsoft/Google", new[] { "Microsoft", "Google" })]
    public async Task ExtractCompanyNamesAsync_SlashSeparated_ReturnsParts(string companyName, string[] expectedParts)
    {
        var extracted = await _sut.ExtractCompanyNamesAsync(companyName);

        extracted.Should().NotBeNull($"'{companyName}' contains '/' and should be split");
        extracted.Should().BeEquivalentTo(expectedParts);
    }

    #endregion

    #region Compound Names with And/Ampersand

    // A name is split on "&" when each side carries its own company suffix (Ltd, PLC, ...).
    [Theory]
    [InlineData("Acme Ltd & Beta Ltd", new[] { "Acme Ltd", "Beta Ltd" })]
    public async Task ExtractCompanyNamesAsync_BothPartsHaveCompanySuffix_ReturnsParts(string companyName, string[] expectedParts)
    {
        var extracted = await _sut.ExtractCompanyNamesAsync(companyName);

        extracted.Should().NotBeNull($"'{companyName}' has company suffixes on both parts");
        extracted.Should().BeEquivalentTo(expectedParts);
    }

    // The rules stay conservative: an ambiguous "&" / "and" is left as one name.
    [Theory]
    [InlineData("Corus & Laura Ashley Hotels")] // Ambiguous - neither has company suffix
    [InlineData("Smith & Jones Consulting")] // Could be a single partnership
    [InlineData("Acme PLC and Beta PLC")] // Matches " plc and " department pattern
    public async Task ExtractCompanyNamesAsync_AmbiguousWithAnd_ReturnsNull(string companyName)
    {
        var extracted = await _sut.ExtractCompanyNamesAsync(companyName);

        extracted.Should().BeNull($"'{companyName}' is ambiguous and should not be split");
    }

    #endregion

    #region Edge Cases

    [Theory]
    [InlineData("")]
    [InlineData(" ")]
    [InlineData(null)]
    public async Task ExtractCompanyNamesAsync_EmptyOrNull_ReturnsNull(string? companyName)
    {
        var extracted = await _sut.ExtractCompanyNamesAsync(companyName!);

        extracted.Should().BeNull();
    }

    [Theory]
    [InlineData("Microsoft")]
    [InlineData("Google")]
    [InlineData("Amazon")]
    [InlineData("Apple Inc")]
    [InlineData("Tesco PLC")]
    public async Task ExtractCompanyNamesAsync_SimpleCompanyName_ReturnsNull(string companyName)
    {
        var extracted = await _sut.ExtractCompanyNamesAsync(companyName);

        extracted.Should().BeNull($"'{companyName}' is a simple company name and should not be split");
    }

    [Fact]
    public async Task ExtractCompanyNamesAsync_ShortParts_ReturnsNull()
    {
        // Each side of the ampersand is a single letter, too short to be a company name.
        const string companyName = "A & B";

        var extracted = await _sut.ExtractCompanyNamesAsync(companyName);

        extracted.Should().BeNull("parts are too short to be valid company names");
    }

    #endregion
}
|
||||
@@ -51,7 +51,7 @@ public sealed class EducationVerifierServiceTests
|
||||
var result = _sut.Verify(education);
|
||||
|
||||
// Assert
|
||||
result.VerificationNotes.Should().Contain("diploma mill blacklist");
|
||||
result.VerificationNotes.Should().Contain("not found in accredited institutions");
|
||||
}
|
||||
|
||||
#endregion
|
||||
|
||||
15
tools/CVBatchTester/CVBatchTester.csproj
Normal file
@@ -0,0 +1,15 @@
|
||||
<Project Sdk="Microsoft.NET.Sdk">
|
||||
|
||||
<PropertyGroup>
|
||||
<OutputType>Exe</OutputType>
|
||||
<TargetFramework>net8.0</TargetFramework>
|
||||
<ImplicitUsings>enable</ImplicitUsings>
|
||||
<Nullable>enable</Nullable>
|
||||
</PropertyGroup>
|
||||
|
||||
<ItemGroup>
|
||||
<ProjectReference Include="../../src/RealCV.Application/RealCV.Application.csproj" />
|
||||
<ProjectReference Include="../../src/RealCV.Infrastructure/RealCV.Infrastructure.csproj" />
|
||||
</ItemGroup>
|
||||
|
||||
</Project>
|
||||
445
tools/CVBatchTester/Program.cs
Normal file
@@ -0,0 +1,445 @@
|
||||
using System.Text.Json;
|
||||
using System.Text.Json.Serialization;
|
||||
using Microsoft.EntityFrameworkCore;
|
||||
using Microsoft.Extensions.Configuration;
|
||||
using Microsoft.Extensions.DependencyInjection;
|
||||
using Microsoft.Extensions.Logging;
|
||||
using RealCV.Application.Interfaces;
|
||||
using RealCV.Application.Models;
|
||||
using RealCV.Infrastructure.Configuration;
|
||||
using RealCV.Infrastructure.Data;
|
||||
using RealCV.Infrastructure.ExternalApis;
|
||||
using RealCV.Infrastructure.Services;
|
||||
|
||||
namespace CVBatchTester;
|
||||
|
||||
// DTOs for test JSON format (snake_case with nested personal object)
|
||||
/// <summary>
/// Root object of a test CV JSON document: metadata about the test case plus the CV content.
/// </summary>
internal record TestCVData
{
    /// <summary>Identifier of the test CV.</summary>
    public string? CvId { get; init; }

    /// <summary>Category label of the test case.</summary>
    public string? Category { get; init; }

    /// <summary>Flags listed in the test document as expected.</summary>
    public List<string>? ExpectedFlags { get; init; }

    /// <summary>Nested personal details of the candidate.</summary>
    public TestPersonalData? Personal { get; init; }

    /// <summary>Free-text profile section.</summary>
    public string? Profile { get; init; }

    /// <summary>Employment history entries.</summary>
    public List<TestEmploymentEntry>? Employment { get; init; }

    /// <summary>Education history entries.</summary>
    public List<TestEducationEntry>? Education { get; init; }

    /// <summary>Listed skills.</summary>
    public List<string>? Skills { get; init; }
}
|
||||
|
||||
/// <summary>
/// The nested "personal" object of a JSON test CV. Every field is optional.
/// </summary>
internal record TestPersonalData
{
    /// <summary>Candidate's full name.</summary>
    public string? Name { get; init; }

    /// <summary>Candidate's email address.</summary>
    public string? Email { get; init; }

    /// <summary>Candidate's phone number.</summary>
    public string? Phone { get; init; }

    /// <summary>Postal address. Not copied by the converter in this file.</summary>
    public string? Address { get; init; }

    /// <summary>LinkedIn reference. Not copied by the converter in this file.</summary>
    public string? LinkedIn { get; init; }
}
|
||||
|
||||
/// <summary>
/// One employment entry of a JSON test CV. Dates stay as raw strings here and are
/// parsed when the entry is converted to the application model.
/// </summary>
internal record TestEmploymentEntry
{
    /// <summary>Employer name as written in the test file.</summary>
    public string? Company { get; init; }

    /// <summary>Job title held at the employer.</summary>
    public string? JobTitle { get; init; }

    /// <summary>Raw start date text.</summary>
    public string? StartDate { get; init; }

    /// <summary>Raw end date text; <c>null</c> is treated as a current role by the converter.</summary>
    public string? EndDate { get; init; }

    /// <summary>Work location.</summary>
    public string? Location { get; init; }

    /// <summary>Free-text role description.</summary>
    public string? Description { get; init; }

    /// <summary>Achievement bullet points. Not copied by the converter in this file.</summary>
    public List<string>? Achievements { get; init; }
}
|
||||
|
||||
/// <summary>
/// One education entry of a JSON test CV. Dates stay as raw strings here and are
/// parsed when the entry is converted to the application model.
/// </summary>
internal record TestEducationEntry
{
    /// <summary>Institution name as written in the test file.</summary>
    public string? Institution { get; init; }

    /// <summary>Qualification claimed.</summary>
    public string? Qualification { get; init; }

    /// <summary>Subject studied.</summary>
    public string? Subject { get; init; }

    /// <summary>Classification text. Not copied by the converter in this file.</summary>
    public string? Classification { get; init; }

    /// <summary>Raw start date text.</summary>
    public string? StartDate { get; init; }

    /// <summary>Raw end date text.</summary>
    public string? EndDate { get; init; }
}
|
||||
|
||||
class Program
|
||||
{
|
||||
// Log file sink. It stays null until Main opens the output file; while it is null,
// Log writes to the console only.
private static StreamWriter? _logWriter;

// Serializer settings used to read the JSON test CVs.
private static readonly JsonSerializerOptions JsonOptions = BuildJsonOptions();

// Builds the serializer settings: snake_case property names, case-insensitive
// matching, and enums accepted as strings.
private static JsonSerializerOptions BuildJsonOptions()
{
    var options = new JsonSerializerOptions
    {
        PropertyNamingPolicy = JsonNamingPolicy.SnakeCaseLower,
        PropertyNameCaseInsensitive = true,
    };

    options.Converters.Add(new JsonStringEnumConverter());
    return options;
}
|
||||
|
||||
/// <summary>
/// Entry point. Verifies every CV found directly inside a folder and writes the report
/// to the console and to a log file.
/// </summary>
/// <param name="args">
/// <c>args[0]</c> is the folder to scan (the user is prompted when it is missing);
/// an optional <c>--output &lt;file&gt;</c> pair overrides the default log file location.
/// </param>
/// <returns>
/// 0 when the batch ran (even if individual CVs failed); 1 when the folder does not
/// exist or contains no CV files.
/// </returns>
static async Task<int> Main(string[] args)
{
    var folderPath = args.FirstOrDefault() ?? AskForFolder();

    if (string.IsNullOrEmpty(folderPath) || !Directory.Exists(folderPath))
    {
        Log($"Error: Folder not found: {folderPath}");
        Log("Usage: CVBatchTester <folder-path> [--output <file>]");
        Log(" e.g. CVBatchTester /home/user/cvs");
        Log(" e.g. CVBatchTester /home/user/cvs --output /tmp/results.log");
        return 1;
    }

    // Check for --output flag; it only counts when a value follows it.
    var outputIndex = Array.IndexOf(args, "--output");
    var logPath = outputIndex >= 0 && outputIndex < args.Length - 1
        ? args[outputIndex + 1]
        : Path.Combine(folderPath, $"batch-results-{DateTime.Now:yyyyMMdd-HHmmss}.log");

    var writer = new StreamWriter(logPath, false) { AutoFlush = true };
    _logWriter = writer;

    int exitCode;
    try
    {
        exitCode = await RunBatchAsync(folderPath, logPath);
    }
    finally
    {
        // Close the log on every path (early return or exception). The field is cleared
        // first so that any later Log call falls back to console-only output.
        _logWriter = null;
        writer.Dispose();
    }

    if (exitCode == 0)
    {
        Console.WriteLine($"\nResults written to: {logPath}");
    }

    return exitCode;
}

// File extensions that are treated as CVs.
private static readonly string[] CvExtensions = [".pdf", ".docx", ".doc", ".json"];

// Running totals collected while the batch is processed.
private sealed class BatchStats
{
    public List<string> UnverifiedEmployers { get; } = new();
    public List<string> UnverifiedInstitutions { get; } = new();
    public int TotalEmployers { get; set; }
    public int VerifiedEmployers { get; set; }
    public int TotalEducation { get; set; }
    public int VerifiedEducation { get; set; }
    public int ProcessedCount { get; set; }
    public int ErrorCount { get; set; }
}

// Writes the report header, processes every CV file and prints the summary.
private static async Task<int> RunBatchAsync(string folderPath, string logPath)
{
    Log($"CV Batch Verification Tester");
    Log($"Processing CVs from: {folderPath}");
    Log($"Output log: {logPath}");
    Log($"Started: {DateTime.Now:yyyy-MM-dd HH:mm:ss}");
    Log(new string('=', 80));

    // Setup DI. The provider is disposed when this method exits so that the
    // services it owns are released on every path.
    var services = new ServiceCollection();
    ConfigureServices(services);
    await using var provider = services.BuildServiceProvider();

    var cvFiles = FindCvFiles(folderPath, logPath);
    Log($"Found {cvFiles.Count} CV files\n");

    if (cvFiles.Count == 0)
    {
        Log("No CV files found (.pdf, .docx, .doc, .json)");
        return 1;
    }

    var stats = new BatchStats();

    foreach (var cvFile in cvFiles)
    {
        Log($"\n{new string('=', 80)}");
        Log($"[{++stats.ProcessedCount}/{cvFiles.Count}] {Path.GetFileName(cvFile)}");
        Log(new string('=', 80));

        try
        {
            using var scope = provider.CreateScope();
            var parser = scope.ServiceProvider.GetRequiredService<ICVParserService>();
            var companyVerifier = scope.ServiceProvider.GetRequiredService<ICompanyVerifierService>();
            var eduVerifier = scope.ServiceProvider.GetRequiredService<IEducationVerifierService>();

            var cv = await LoadCvAsync(cvFile, parser);
            await VerifyEmployersAsync(cv, companyVerifier, stats);
            VerifyEducation(cv, eduVerifier, stats);
        }
        catch (Exception ex)
        {
            // One bad file must not stop the batch; it is counted and reported instead.
            stats.ErrorCount++;
            Log($"ERROR processing file: {ex.Message}");
        }
    }

    PrintSummary(stats, cvFiles.Count);
    return 0;
}

// Lists the CV files directly inside the folder, sorted by path. The log file itself is
// excluded so that an --output file with a CV extension is not processed as a CV.
private static List<string> FindCvFiles(string folderPath, string logPath)
{
    var logFullPath = Path.GetFullPath(logPath);

    return Directory.GetFiles(folderPath, "*.*", SearchOption.TopDirectoryOnly)
        .Where(f => CvExtensions.Any(ext => f.EndsWith(ext, StringComparison.OrdinalIgnoreCase)))
        .Where(f => !string.Equals(Path.GetFullPath(f), logFullPath, StringComparison.Ordinal))
        .OrderBy(f => f)
        .ToList();
}

// Loads one CV: JSON test files are deserialized and converted, everything else goes through the parser.
private static async Task<CVData> LoadCvAsync(string cvFile, ICVParserService parser)
{
    CVData cv;

    if (cvFile.EndsWith(".json", StringComparison.OrdinalIgnoreCase))
    {
        var jsonContent = await File.ReadAllTextAsync(cvFile);
        var testCv = JsonSerializer.Deserialize<TestCVData>(jsonContent, JsonOptions)
            ?? throw new InvalidOperationException("Failed to deserialize JSON CV");

        cv = ConvertTestCVData(testCv);
        Log($"Loaded JSON CV: {cv.FullName}");
    }
    else
    {
        await using var stream = File.OpenRead(cvFile);
        cv = await parser.ParseAsync(stream, Path.GetFileName(cvFile));
        Log($"Parsed CV: {cv.FullName}");
    }

    return cv;
}

// Verifies each employer on the CV, logs the outcome and updates the running totals.
private static async Task VerifyEmployersAsync(CVData cv, ICompanyVerifierService companyVerifier, BatchStats stats)
{
    if (cv.Employment?.Count > 0)
    {
        Log($"\nEMPLOYERS ({cv.Employment.Count}):");
        Log(new string('-', 60));

        foreach (var emp in cv.Employment)
        {
            stats.TotalEmployers++;
            try
            {
                var result = await companyVerifier.VerifyCompanyAsync(
                    emp.CompanyName,
                    emp.StartDate,
                    emp.EndDate,
                    emp.JobTitle);

                var icon = result.IsVerified ? "✓" : "✗";
                var period = FormatPeriod(emp.StartDate, emp.EndDate);

                Log($"\n {icon} {emp.CompanyName}");
                Log($" Period: {period}");
                Log($" Role: {emp.JobTitle}");

                if (result.IsVerified)
                {
                    stats.VerifiedEmployers++;
                    Log($" Match: {result.MatchedCompanyName} ({result.MatchScore}%)");
                    if (!string.IsNullOrEmpty(result.MatchedCompanyNumber))
                        Log($" Company #: {result.MatchedCompanyNumber}");
                    if (!string.IsNullOrEmpty(result.CompanyStatus))
                        Log($" Status: {result.CompanyStatus}");
                }
                else
                {
                    stats.UnverifiedEmployers.Add(emp.CompanyName);
                }

                if (!string.IsNullOrEmpty(result.VerificationNotes))
                    Log($" Note: {result.VerificationNotes}");
            }
            catch (Exception ex)
            {
                // A failed lookup counts as unverified; the remaining employers are still checked.
                Log($"\n ✗ {emp.CompanyName}");
                Log($" ERROR: {ex.Message}");
                stats.UnverifiedEmployers.Add(emp.CompanyName);
            }
        }
    }
}

// Verifies the education entries on the CV, logs the outcome and updates the running totals.
private static void VerifyEducation(CVData cv, IEducationVerifierService eduVerifier, BatchStats stats)
{
    if (cv.Education?.Count > 0)
    {
        Log($"\nEDUCATION ({cv.Education.Count}):");
        Log(new string('-', 60));

        var eduEntries = cv.Education.Select(e => new EducationEntry
        {
            Institution = e.Institution,
            Qualification = e.Qualification,
            Subject = e.Subject,
            StartDate = e.StartDate,
            EndDate = e.EndDate
        }).ToList();

        var eduResults = eduVerifier.VerifyAll(eduEntries);

        foreach (var result in eduResults)
        {
            stats.TotalEducation++;
            var icon = result.IsVerified ? "✓" : "✗";

            Log($"\n {icon} {result.ClaimedInstitution}");
            Log($" Qualification: {result.ClaimedQualification}");
            if (!string.IsNullOrEmpty(result.ClaimedSubject))
                Log($" Subject: {result.ClaimedSubject}");

            if (result.IsVerified)
            {
                stats.VerifiedEducation++;

                // Only show the matched name when it differs from what the CV claimed.
                if (result.MatchedInstitution != null &&
                    !result.MatchedInstitution.Equals(result.ClaimedInstitution, StringComparison.OrdinalIgnoreCase))
                {
                    Log($" Match: {result.MatchedInstitution}");
                }
            }
            else
            {
                stats.UnverifiedInstitutions.Add(result.ClaimedInstitution ?? "Unknown");
                Log($" Status: {result.Status}");
            }

            if (!string.IsNullOrEmpty(result.VerificationNotes))
                Log($" Note: {result.VerificationNotes}");
        }
    }
}

// Prints the totals followed by the unverified employers and institutions.
private static void PrintSummary(BatchStats stats, int fileCount)
{
    Log($"\n\n{new string('=', 80)}");
    Log("VERIFICATION SUMMARY");
    Log(new string('=', 80));

    Log($"\nCVs Processed: {stats.ProcessedCount - stats.ErrorCount}/{fileCount}");
    if (stats.ErrorCount > 0)
        Log($"Errors: {stats.ErrorCount}");

    // Whole-number percentages; a zero total is reported as 0% rather than dividing by zero.
    var empRate = stats.TotalEmployers > 0 ? stats.VerifiedEmployers * 100 / stats.TotalEmployers : 0;
    var eduRate = stats.TotalEducation > 0 ? stats.VerifiedEducation * 100 / stats.TotalEducation : 0;

    Log($"\nEmployers: {stats.VerifiedEmployers}/{stats.TotalEmployers} verified ({empRate}%)");
    Log($"Education: {stats.VerifiedEducation}/{stats.TotalEducation} verified ({eduRate}%)");

    LogUnverified("EMPLOYERS", stats.UnverifiedEmployers);
    LogUnverified("INSTITUTIONS", stats.UnverifiedInstitutions);

    Log($"\nCompleted: {DateTime.Now:yyyy-MM-dd HH:mm:ss}");
    Log($"\n{new string('=', 80)}");
}

// Logs the distinct names (case-insensitive), most frequent first, with a repeat count when above one.
private static void LogUnverified(string label, List<string> names)
{
    var groups = names
        .GroupBy(n => n, StringComparer.OrdinalIgnoreCase)
        .OrderByDescending(g => g.Count())
        .ThenBy(g => g.Key)
        .ToList();

    if (groups.Count == 0)
    {
        return;
    }

    Log($"\n{new string('-', 60)}");
    Log($"UNVERIFIED {label} ({groups.Count} unique):");

    foreach (var group in groups)
    {
        var occurrences = group.Count();
        var count = occurrences > 1 ? $" (x{occurrences})" : "";
        Log($" - {group.Key}{count}");
    }
}
|
||||
|
||||
/// <summary>
/// Echoes a message to the console and, when a log file is open, to that file as well.
/// </summary>
/// <param name="message">Text to write, followed by a line break.</param>
static void Log(string message)
{
    Console.WriteLine(message);

    // The writer is only set while Main has the output file open.
    if (_logWriter is { } writer)
    {
        writer.WriteLine(message);
    }
}
|
||||
|
||||
/// <summary>
/// Prompts on the console for the CV folder path.
/// </summary>
/// <returns>The line the user typed, or an empty string when no line is available.</returns>
static string AskForFolder()
{
    Console.Write("Enter CV folder path: ");

    var typed = Console.ReadLine();
    return typed is null ? "" : typed;
}
|
||||
|
||||
/// <summary>
/// Formats an employment period as "start - end" using month-and-year text.
/// </summary>
/// <param name="start">Start date; shown as "?" when missing.</param>
/// <param name="end">End date; shown as "Present" when missing.</param>
/// <returns>The formatted period.</returns>
static string FormatPeriod(DateOnly? start, DateOnly? end)
{
    const string monthYear = "MMM yyyy";

    var from = start.HasValue ? start.Value.ToString(monthYear) : "?";
    var to = end.HasValue ? end.Value.ToString(monthYear) : "Present";

    return from + " - " + to;
}
|
||||
|
||||
/// <summary>
/// Converts a deserialized JSON test CV into the application's <c>CVData</c> model.
/// </summary>
/// <param name="testCv">The test CV read from a <c>.json</c> file.</param>
/// <returns>
/// A <c>CVData</c> whose name, company, job title and institution fall back to "Unknown"
/// when missing, and whose employment, education and skills lists are empty rather than
/// null when the JSON omits them.
/// </returns>
static CVData ConvertTestCVData(TestCVData testCv)
{
    return new CVData
    {
        FullName = testCv.Personal?.Name ?? "Unknown",
        Email = testCv.Personal?.Email,
        Phone = testCv.Personal?.Phone,
        Employment = testCv.Employment?.Select(e => new EmploymentEntry
        {
            CompanyName = e.Company ?? "Unknown",
            JobTitle = e.JobTitle ?? "Unknown",
            Location = e.Location,
            StartDate = ParseDate(e.StartDate),
            EndDate = ParseDate(e.EndDate),
            // A blank end date is parsed to null above, so it must count as a current
            // role here as well; checking only for null left the two values inconsistent.
            IsCurrent = string.IsNullOrWhiteSpace(e.EndDate),
            Description = e.Description
        }).ToList() ?? [],
        Education = testCv.Education?.Select(e => new EducationEntry
        {
            Institution = e.Institution ?? "Unknown",
            Qualification = e.Qualification,
            Subject = e.Subject,
            StartDate = ParseDate(e.StartDate),
            EndDate = ParseDate(e.EndDate)
        }).ToList() ?? [],
        Skills = testCv.Skills ?? []
    };
}
|
||||
|
||||
/// <summary>
/// Parses a date string from a JSON test CV.
/// </summary>
/// <param name="dateStr">
/// Either a <c>YYYY-MM</c> value (mapped to the first day of that month) or any text
/// accepted by <see cref="DateOnly.TryParse(string, out DateOnly)"/>.
/// </param>
/// <returns>The parsed date, or <c>null</c> when the text is missing or not a valid date.</returns>
static DateOnly? ParseDate(string? dateStr)
{
    if (string.IsNullOrEmpty(dateStr)) return null;

    // Try parsing YYYY-MM format. The range checks matter: DateOnly's constructor throws
    // for a month outside 1-12 or a year outside 1-9999, and bad data should yield null.
    if (dateStr.Length == 7 && dateStr[4] == '-'
        && int.TryParse(dateStr[..4], out var year)
        && int.TryParse(dateStr[5..], out var month)
        && year is >= 1 and <= 9999
        && month is >= 1 and <= 12)
    {
        return new DateOnly(year, month, 1);
    }

    // Try standard parsing
    if (DateOnly.TryParse(dateStr, out var date))
    {
        return date;
    }

    return null;
}
|
||||
|
||||
/// <summary>
/// Registers configuration-bound settings, logging, the database context factory and the
/// verification services used by the batch tester.
/// </summary>
/// <param name="services">The service collection to populate.</param>
static void ConfigureServices(IServiceCollection services)
{
    // Load configuration - try multiple locations
    var configPaths = new[]
    {
        "/var/www/realcv",
        "/git/RealCV/src/RealCV.Web",
        Path.GetFullPath(Path.Combine(AppContext.BaseDirectory, "..", "..", "..", "..", "..", "src", "RealCV.Web"))
    };

    // When none of the candidates exists, fall back to the tool's own directory. Falling
    // back to one of the candidates would hand SetBasePath a directory already known to be
    // missing, which fails before the optional JSON files are even considered.
    var webProjectPath = configPaths.FirstOrDefault(Directory.Exists) ?? AppContext.BaseDirectory;
    Log($"Loading config from: {webProjectPath}");

    var configuration = new ConfigurationBuilder()
        .SetBasePath(webProjectPath)
        .AddJsonFile("appsettings.json", optional: true)
        .AddJsonFile("appsettings.Development.json", optional: true)
        .AddJsonFile("appsettings.Production.json", optional: true)
        .Build();

    // Logging - show info level for verification details
    services.AddLogging(builder =>
    {
        builder.AddConsole();
        builder.SetMinimumLevel(LogLevel.Information);
        // Filter out noisy libraries
        builder.AddFilter("Microsoft", LogLevel.Warning);
        builder.AddFilter("System", LogLevel.Warning);
    });

    // Database. The connection string comes from configuration or, failing that, from the
    // ConnectionStrings__DefaultConnection environment variable. No credentials are kept
    // in source; without a connection string only database-backed lookups fail.
    var connectionString = configuration.GetConnectionString("DefaultConnection");
    if (string.IsNullOrWhiteSpace(connectionString))
    {
        connectionString = Environment.GetEnvironmentVariable("ConnectionStrings__DefaultConnection");
    }

    if (string.IsNullOrWhiteSpace(connectionString))
    {
        // UseSqlServer accepts null but rejects an empty string, so normalise to null.
        connectionString = null;
        Log("WARNING: No 'DefaultConnection' connection string configured; database-backed lookups will fail.");
    }

    services.AddDbContextFactory<ApplicationDbContext>(options =>
        options.UseSqlServer(connectionString));

    // Companies House - use configuration binding
    services.Configure<CompaniesHouseSettings>(configuration.GetSection(CompaniesHouseSettings.SectionName));
    services.AddHttpClient<CompaniesHouseClient>();

    // Anthropic - use configuration binding
    services.Configure<AnthropicSettings>(configuration.GetSection(AnthropicSettings.SectionName));
    services.AddScoped<ICompanyNameMatcherService, AICompanyNameMatcherService>();

    // Services
    services.AddScoped<ICompanyVerifierService, CompanyVerifierService>();
    services.AddScoped<IEducationVerifierService, EducationVerifierService>();
    services.AddScoped<ICVParserService, CVParserService>();
}
|
||||
}
|
||||
195
tools/batch-test-cvs.cs
Normal file
@@ -0,0 +1,195 @@
|
||||
#!/usr/bin/env dotnet-script
|
||||
#r "nuget: Microsoft.EntityFrameworkCore.SqlServer, 8.0.0"
|
||||
#r "nuget: Microsoft.Extensions.Configuration.Json, 8.0.0"
|
||||
#r "nuget: Microsoft.Extensions.DependencyInjection, 8.0.0"
|
||||
#r "nuget: Microsoft.Extensions.Logging.Console, 8.0.0"
|
||||
#r "../src/RealCV.Application/bin/Debug/net8.0/RealCV.Application.dll"
|
||||
#r "../src/RealCV.Infrastructure/bin/Debug/net8.0/RealCV.Infrastructure.dll"
|
||||
#r "../src/RealCV.Domain/bin/Debug/net8.0/RealCV.Domain.dll"
|
||||
|
||||
// This is a dotnet-script file. Run with: dotnet script batch-test-cvs.cs -- /path/to/cvs
|
||||
// Install dotnet-script: dotnet tool install -g dotnet-script
|
||||
|
||||
using System;
|
||||
using System.IO;
|
||||
using System.Linq;
|
||||
using System.Threading.Tasks;
|
||||
using System.Collections.Generic;
|
||||
using System.Text.Json;
|
||||
using Microsoft.EntityFrameworkCore;
|
||||
using Microsoft.Extensions.Configuration;
|
||||
using Microsoft.Extensions.DependencyInjection;
|
||||
using Microsoft.Extensions.Logging;
|
||||
using RealCV.Application.Interfaces;
|
||||
using RealCV.Application.Models;
|
||||
using RealCV.Infrastructure.Data;
|
||||
using RealCV.Infrastructure.Services;
|
||||
using RealCV.Infrastructure.ExternalApis;
|
||||
using RealCV.Infrastructure.Configuration;
|
||||
|
||||
// Batch-verifies every .pdf/.docx CV in a folder and prints a report to the console.
// The folder is the first script argument and defaults to /tmp/test-cvs.
var folderPath = Args.FirstOrDefault() ?? "/tmp/test-cvs";

if (!Directory.Exists(folderPath))
{
    Console.WriteLine($"Error: Folder not found: {folderPath}");
    Console.WriteLine("Usage: dotnet script batch-test-cvs.cs -- /path/to/cvs");
    return 1;
}

// An 80-character rule. The interpolation {'=',-80} only pads a single '=' to width 80
// with spaces, so the rule is built explicitly.
var separator = new string('=', 80);

Console.WriteLine($"Processing CVs from: {folderPath}");
Console.WriteLine(separator);

// Setup DI
var services = new ServiceCollection();

var configuration = new ConfigurationBuilder()
    .SetBasePath(Path.Combine(Directory.GetCurrentDirectory(), "../src/RealCV.Web"))
    .AddJsonFile("appsettings.json", optional: true)
    .AddJsonFile("appsettings.Development.json", optional: true)
    .Build();

services.AddLogging(b => b.AddConsole().SetMinimumLevel(LogLevel.Warning));

services.AddDbContextFactory<ApplicationDbContext>(options =>
    options.UseSqlServer(configuration.GetConnectionString("DefaultConnection")));

services.Configure<CompaniesHouseSettings>(configuration.GetSection("CompaniesHouse"));
services.Configure<AnthropicSettings>(configuration.GetSection("Anthropic"));

// NOTE(review): the compiled CVBatchTester tool registers AICompanyNameMatcherService and
// no AnthropicClient; confirm these two registrations still match the current services.
services.AddHttpClient<CompaniesHouseClient>();
services.AddHttpClient<AnthropicClient>();
services.AddScoped<ICompanyNameMatcherService, CompanyNameMatcherService>();
services.AddScoped<ICompanyVerifierService, CompanyVerifierService>();
services.AddScoped<IEducationVerifierService, EducationVerifierService>();
services.AddScoped<ICVParserService, CVParserService>();

var provider = services.BuildServiceProvider();

// Sorted so that the report order is the same on every run.
var cvFiles = Directory.GetFiles(folderPath, "*.*")
    .Where(f => f.EndsWith(".pdf", StringComparison.OrdinalIgnoreCase) ||
                f.EndsWith(".docx", StringComparison.OrdinalIgnoreCase))
    .OrderBy(f => f)
    .ToList();

Console.WriteLine($"Found {cvFiles.Count} CV files\n");

var allUnverifiedEmployers = new List<string>();
var allUnverifiedInstitutions = new List<string>();
var totalEmployers = 0;
var verifiedEmployers = 0;
var totalEducation = 0;
var verifiedEducation = 0;
var errorCount = 0;

foreach (var cvFile in cvFiles)
{
    Console.WriteLine($"\n{separator}");
    Console.WriteLine($"FILE: {Path.GetFileName(cvFile)}");
    Console.WriteLine(separator);

    try
    {
        using var scope = provider.CreateScope();
        var parser = scope.ServiceProvider.GetRequiredService<ICVParserService>();
        var companyVerifier = scope.ServiceProvider.GetRequiredService<ICompanyVerifierService>();
        var eduVerifier = scope.ServiceProvider.GetRequiredService<IEducationVerifierService>();

        await using var stream = File.OpenRead(cvFile);
        var cv = await parser.ParseAsync(stream, Path.GetFileName(cvFile));

        // CVData exposes the candidate name as FullName (the compiled CVBatchTester tool
        // reads and assigns it directly).
        var candidate = string.IsNullOrWhiteSpace(cv.FullName) ? "Unknown" : cv.FullName;
        Console.WriteLine($"Candidate: {candidate}");

        // Employers
        if (cv.Employment?.Count > 0)
        {
            Console.WriteLine($"\nEMPLOYERS ({cv.Employment.Count}):");
            foreach (var emp in cv.Employment)
            {
                totalEmployers++;
                try
                {
                    var result = await companyVerifier.VerifyCompanyAsync(
                        emp.CompanyName, emp.StartDate, emp.EndDate, emp.JobTitle);

                    var icon = result.IsVerified ? "✓" : "✗";
                    Console.WriteLine($" {icon} {emp.CompanyName}");

                    if (result.IsVerified)
                    {
                        verifiedEmployers++;
                        Console.WriteLine($" → {result.MatchedCompanyName} ({result.MatchScore}%)");
                        if (!string.IsNullOrEmpty(result.VerificationNotes))
                            Console.WriteLine($" Note: {result.VerificationNotes}");
                    }
                    else
                    {
                        allUnverifiedEmployers.Add(emp.CompanyName);
                        Console.WriteLine($" Note: {result.VerificationNotes ?? "Not found"}");
                    }
                }
                catch (Exception ex)
                {
                    // A failed lookup counts as unverified; the remaining employers and the
                    // education section of this CV are still processed.
                    Console.WriteLine($" ✗ {emp.CompanyName}");
                    Console.WriteLine($" ERROR: {ex.Message}");
                    allUnverifiedEmployers.Add(emp.CompanyName);
                }
            }
        }

        // Education
        if (cv.Education?.Count > 0)
        {
            Console.WriteLine($"\nEDUCATION ({cv.Education.Count}):");
            var eduEntries = cv.Education.Select(e => new EducationEntry
            {
                Institution = e.Institution,
                Qualification = e.Qualification,
                Subject = e.Subject,
                StartDate = e.StartDate,
                EndDate = e.EndDate
            }).ToList();

            var eduResults = eduVerifier.VerifyAll(eduEntries);
            foreach (var result in eduResults)
            {
                totalEducation++;
                var icon = result.IsVerified ? "✓" : "✗";
                Console.WriteLine($" {icon} {result.ClaimedInstitution}");
                Console.WriteLine($" {result.ClaimedQualification}");

                if (result.IsVerified)
                {
                    verifiedEducation++;
                    if (result.MatchedInstitution != null && result.MatchedInstitution != result.ClaimedInstitution)
                        Console.WriteLine($" → {result.MatchedInstitution}");
                }
                else
                {
                    allUnverifiedInstitutions.Add(result.ClaimedInstitution ?? "Unknown");
                    Console.WriteLine($" Status: {result.Status}");
                    if (!string.IsNullOrEmpty(result.VerificationNotes))
                        Console.WriteLine($" Note: {result.VerificationNotes}");
                }
            }
        }
    }
    catch (Exception ex)
    {
        // One bad file must not stop the batch; it is counted and reported in the summary.
        errorCount++;
        Console.WriteLine($"ERROR: {ex.Message}");
    }
}

// Summary
Console.WriteLine($"\n\n{separator}");
Console.WriteLine("SUMMARY");
Console.WriteLine(separator);
Console.WriteLine($"CVs Processed: {cvFiles.Count - errorCount}/{cvFiles.Count}");
if (errorCount > 0)
    Console.WriteLine($"Errors: {errorCount}");
Console.WriteLine($"Employers: {verifiedEmployers}/{totalEmployers} verified ({(totalEmployers > 0 ? verifiedEmployers * 100 / totalEmployers : 0)}%)");
Console.WriteLine($"Education: {verifiedEducation}/{totalEducation} verified ({(totalEducation > 0 ? verifiedEducation * 100 / totalEducation : 0)}%)");

// Names that differ only by letter case are the same employer or institution.
var uniqueUnverifiedEmployers = allUnverifiedEmployers
    .Distinct(StringComparer.OrdinalIgnoreCase)
    .OrderBy(x => x)
    .ToList();
if (uniqueUnverifiedEmployers.Count > 0)
{
    Console.WriteLine($"\nUNVERIFIED EMPLOYERS ({uniqueUnverifiedEmployers.Count}):");
    foreach (var emp in uniqueUnverifiedEmployers)
        Console.WriteLine($" - {emp}");
}

var uniqueUnverifiedInstitutions = allUnverifiedInstitutions
    .Distinct(StringComparer.OrdinalIgnoreCase)
    .OrderBy(x => x)
    .ToList();
if (uniqueUnverifiedInstitutions.Count > 0)
{
    Console.WriteLine($"\nUNVERIFIED INSTITUTIONS ({uniqueUnverifiedInstitutions.Count}):");
    foreach (var inst in uniqueUnverifiedInstitutions)
        Console.WriteLine($" - {inst}");
}

// Release the services owned by the provider before the script exits.
provider.Dispose();

return 0;
|
||||