Fix all UKDS (ukdataservices.co.uk) SEO cross-contamination risks

- Remove old sitemaps pointing to ukdataservices.co.uk URLs
- Delete llms.txt and llms-full.txt (they contained ukdataservices references)
- Replace all web scraping text in PHP files with AI automation equivalents
- Add noindex to legal boilerplate pages (privacy, terms, cookie, GDPR) to prevent a duplicate-content penalty
- Fix OG/Twitter social card images from ukds-* filenames to ukaiautomation-*
- Fix lead-capture.php to write logs to ukaiautomation directory
- Fix sitemap.php, quote-handler, canonical.php, related-services component
This commit is contained in:
Peter Foster
2026-03-21 10:13:14 +00:00
parent 37a6b01598
commit 8eafc04b0f
29 changed files with 181 additions and 853 deletions

View File

@@ -45,23 +45,23 @@ $related_articles = [
'read_time' => '15 min read'
]
],
'Web Scraping' => [
'AI Automation' => [
[
'title' => 'Web Scraping Compliance UK Guide',
'slug' => 'web-scraping-compliance-uk-guide',
'category' => 'Web Scraping',
'title' => 'AI Automation Compliance UK Guide',
'slug' => 'web-Automation-compliance-uk-guide',
'category' => 'AI Automation',
'read_time' => '10 min read'
],
[
'title' => 'Handling CAPTCHAs in Web Scraping',
'slug' => 'handling-captchas-scraping',
'category' => 'Web Scraping',
'title' => 'Handling CAPTCHAs in AI Automation',
'slug' => 'handling-captchas-Automation',
'category' => 'AI Automation',
'read_time' => '7 min read'
],
[
'title' => 'JavaScript Heavy Sites Scraping',
'slug' => 'javascript-heavy-sites-scraping',
'category' => 'Web Scraping',
'title' => 'JavaScript Heavy Sites Automation',
'slug' => 'javascript-heavy-sites-Automation',
'category' => 'AI Automation',
'read_time' => '9 min read'
]
],
@@ -103,11 +103,11 @@ $display_articles = array_slice($filtered_articles, 0, 3);
<div class="cta-inner">
<div class="cta-text">
<h3>Need data for your business?</h3>
<p>UK AI Automation delivers GDPR-compliant web scraping, data extraction, and analytics — tailored to your industry. 99.8% accuracy, fast turnaround, no long-term contracts.</p>
<p>UK AI Automation delivers GDPR-compliant AI Automation, data extraction, and analytics — tailored to your industry. 99.8% accuracy, fast turnaround, no long-term contracts.</p>
</div>
<div class="cta-actions">
<a href="/quote" class="cta-btn cta-btn-primary">Get a Free Quote</a>
<a href="/services/web-scraping" class="cta-btn cta-btn-outline">See Our Services</a>
<a href="/services/web-Automation" class="cta-btn cta-btn-outline">See Our Services</a>
</div>
</div>
</section>

View File

@@ -18,14 +18,14 @@ $authors = [
'role' => 'Data Intelligence Experts',
'bio' => 'Our editorial team comprises data scientists, engineers, and industry analysts with over 50 combined years of experience in AI automation, data pipelines, and business intelligence across UK industries.',
'linkedin' => null,
'expertise' => ['Web Scraping', 'Data Analytics', 'Business Intelligence', 'GDPR Compliance'],
'expertise' => ['AI Automation', 'Data Analytics', 'Business Intelligence', 'GDPR Compliance'],
'image' => '/assets/images/authors/team-avatar.svg'
],
'James Wilson' => [
'role' => 'Senior Data Architect',
'bio' => 'James is a Senior Data Architect with 12+ years of experience in enterprise web scraping and business intelligence. He holds a Master\'s degree in Computer Science from Imperial College London and is an AWS Solutions Architect Professional.',
'bio' => 'James is a Senior Data Architect with 12+ years of experience in enterprise AI Automation and business intelligence. He holds a Master\'s degree in Computer Science from Imperial College London and is an AWS Solutions Architect Professional.',
'linkedin' => 'https://linkedin.com/company/ukaiautomation',
'expertise' => ['Enterprise Architecture', 'Web Scraping', 'Cloud Solutions', 'Data Pipelines'],
'expertise' => ['Enterprise Architecture', 'AI Automation', 'Cloud Solutions', 'Data Pipelines'],
'image' => '/assets/images/authors/james-wilson.svg'
],
'Dr. Rachel Singh' => [
@@ -36,10 +36,10 @@ $authors = [
'image' => '/assets/images/authors/rachel-singh.svg'
],
'Michael Thompson' => [
'role' => 'Technical Lead - Web Scraping',
'bio' => 'Michael specializes in large-scale web scraping infrastructure and has designed data collection systems for FTSE 100 companies. He has 10+ years of experience in Python, Scrapy, and distributed systems.',
'role' => 'Technical Lead - AI Automation',
'bio' => 'Michael specializes in large-scale AI Automation infrastructure and has designed data collection systems for FTSE 100 companies. He has 10+ years of experience in Python, Scrapy, and distributed systems.',
'linkedin' => 'https://linkedin.com/company/ukaiautomation',
'expertise' => ['Python', 'Scrapy', 'Distributed Systems', 'Web Scraping'],
'expertise' => ['Python', 'Scrapy', 'Distributed Systems', 'AI Automation'],
'image' => '/assets/images/authors/michael-thompson.svg'
],
'Sarah Chen' => [

View File

@@ -112,7 +112,6 @@ function getPageUrl($pageKey) {
// Services
'services' => '/#services',
'web-scraping' => '/services/web-scraping',
'competitive-intelligence' => '/services/competitive-intelligence',
'price-monitoring' => '/services/price-monitoring',
'data-cleaning' => '/services/data-cleaning',

View File

@@ -4,7 +4,7 @@
* Displays related services at the bottom of service pages
*
* Usage:
* $currentService = 'web-scraping';
* $currentService = 'document-extraction';
* include($_SERVER['DOCUMENT_ROOT'] . '/includes/components/related-services.php');
*/

View File

@@ -53,7 +53,7 @@ function generateArticleSchema($title, $description, $datePublished, $dateModifi
'name' => 'UK AI Automation',
'logo' => [
'@type' => 'ImageObject',
'url' => $baseUrl . '/assets/images/ukds-main-logo.png'
'url' => $baseUrl . '/assets/images/ukaiautomation-logo.svg'
]
],
'image' => [
@@ -125,7 +125,7 @@ function generateBlogPostingSchema($title, $description, $datePublished, $dateMo
'name' => 'UK AI Automation',
'logo' => [
'@type' => 'ImageObject',
'url' => $baseUrl . '/assets/images/ukds-main-logo.png',
'url' => $baseUrl . '/assets/images/ukaiautomation-logo.svg',
'width' => 300,
'height' => 100
]
@@ -173,7 +173,7 @@ $authorProfiles = [
'technical-team' => [
'name' => 'UK AI Automation Technical Team',
'role' => 'Senior Data Engineers',
'description' => 'Expert engineers specializing in web scraping technologies, data pipelines, and enterprise data solutions.'
'description' => 'Expert engineers specializing in AI Automation technologies, data pipelines, and enterprise data solutions.'
],
'compliance-team' => [
'name' => 'UK AI Automation Compliance Team',

View File

@@ -5,7 +5,7 @@
*
* Usage:
* $faqs = [
* ['question' => 'What is web scraping?', 'answer' => 'Web scraping is...'],
* ['question' => 'What is AI Automation?', 'answer' => 'AI Automation is...'],
* ['question' => 'How much does it cost?', 'answer' => 'Pricing varies...']
* ];
* include($_SERVER['DOCUMENT_ROOT'] . '/includes/schema/faq-schema.php');
@@ -63,12 +63,12 @@ function generateFAQSchema($faqs, $pageUrl = null, $pageName = null) {
$commonFAQs = [
'general' => [
[
'question' => 'What is web scraping and how can it benefit my business?',
'answer' => 'Web scraping is the automated process of extracting data from websites. It benefits businesses by providing competitive intelligence, automating data collection, enabling real-time price monitoring, and supporting strategic decision-making with accurate market data.'
'question' => 'What is AI Automation and how can it benefit my business?',
'answer' => 'AI Automation is the automated process of extracting data from websites. It benefits businesses by providing competitive intelligence, automating data collection, enabling real-time price monitoring, and supporting strategic decision-making with accurate market data.'
],
[
'question' => 'Is web scraping legal in the UK?',
'answer' => 'Yes, web scraping is legal in the UK when conducted properly. We ensure full compliance with UK Data Protection Act 2018, GDPR, website terms of service, and industry best practices. We only collect publicly available data and respect robots.txt directives.'
'question' => 'Is AI Automation legal in the UK?',
'answer' => 'Yes, AI Automation is legal in the UK when conducted properly. We ensure full compliance with UK Data Protection Act 2018, GDPR, website terms of service, and industry best practices. We only collect publicly available data and respect robots.txt directives.'
],
[
'question' => 'How do you ensure data accuracy?',
@@ -85,7 +85,7 @@ $commonFAQs = [
],
'pricing' => [
[
'question' => 'What factors affect the cost of web scraping services?',
'question' => 'What factors affect the cost of AI Automation Services?',
'answer' => 'Costs depend on several factors: the number and complexity of target websites, data volume required, frequency of updates, anti-bot measures to navigate, data cleaning requirements, and delivery format preferences.'
],
[

View File

@@ -9,7 +9,7 @@
* 'region' => 'Greater London',
* 'latitude' => 51.5074,
* 'longitude' => -0.1278,
* 'services' => ['Web Scraping', 'Data Analytics']
* 'services' => ['AI Automation', 'Data Analytics']
* ];
* include($_SERVER['DOCUMENT_ROOT'] . '/includes/schema/local-business-schema.php');
*/
@@ -33,7 +33,7 @@ function generateLocalBusinessSchema($city, $region, $services = [], $latitude =
'@type' => 'LocalBusiness',
'@id' => $baseUrl . '/locations/' . $citySlug . '#localbusiness',
'name' => 'UK AI Automation - ' . $city,
'description' => 'Professional web scraping, data extraction, and business intelligence services for ' . $city . ' businesses. GDPR-compliant data solutions across ' . $region . '.',
'description' => 'Professional AI Automation, data extraction, and business intelligence services for ' . $city . ' businesses. GDPR-compliant data solutions across ' . $region . '.',
'url' => $baseUrl . '/locations/' . $citySlug,
'telephone' => '',
'email' => 'info@ukaiautomation.co.uk',
@@ -58,7 +58,7 @@ function generateLocalBusinessSchema($city, $region, $services = [], $latitude =
'@id' => $baseUrl . '/#organization',
'name' => 'UK AI Automation'
],
'image' => $baseUrl . '/assets/images/ukds-main-logo.png',
'image' => $baseUrl . '/assets/images/ukaiautomation-logo.svg',
'sameAs' => [
'https://www.linkedin.com/company/ukaiautomation',
'https://twitter.com/ukaiautomation'
@@ -129,7 +129,7 @@ $locationConfigs = [
'latitude' => 51.5074,
'longitude' => -0.1278,
'services' => [
'Web Scraping',
'AI Automation',
'Data Analytics',
'Financial Data Services',
'Competitive Intelligence',
@@ -150,7 +150,7 @@ $locationConfigs = [
'longitude' => -2.2426,
'services' => [
'Data Analytics',
'Web Scraping',
'AI Automation',
'Business Intelligence',
'Price Monitoring',
'Data Cleaning'
@@ -170,7 +170,7 @@ $locationConfigs = [
'longitude' => -1.8904,
'services' => [
'Data Services',
'Web Scraping',
'AI Automation',
'Business Intelligence',
'Data Cleaning',
'Competitive Intelligence'
@@ -190,7 +190,7 @@ $locationConfigs = [
'longitude' => -3.1883,
'services' => [
'Data Analytics',
'Web Scraping',
'AI Automation',
'Financial Data',
'Business Intelligence'
],
@@ -208,7 +208,7 @@ $locationConfigs = [
'longitude' => -3.1791,
'services' => [
'Data Services',
'Web Scraping',
'AI Automation',
'Business Intelligence',
'Data Cleaning'
],

View File

@@ -114,7 +114,7 @@ $siteTestimonials = [
[
'author' => 'James Mitchell',
'authorRole' => 'Retail Director, London Fashion Group',
'reviewBody' => 'UK AI Automation transformed our competitor analysis process. Their web scraping accuracy and speed helped us make better pricing decisions. We\'ve seen a 23% improvement in our market positioning since working with them.',
'reviewBody' => 'UK AI Automation transformed our competitor analysis process. Their AI Automation accuracy and speed helped us make better pricing decisions. We\'ve seen a 23% improvement in our market positioning since working with them.',
'ratingValue' => 5,
'datePublished' => '2024-09-15'
],
@@ -159,11 +159,11 @@ $siteTestimonials = [
* Service-specific testimonials
*/
$serviceTestimonials = [
'web-scraping' => [
'web-Automation' => [
[
'author' => 'Robert Harris',
'authorRole' => 'CTO, E-commerce Solutions Ltd',
'reviewBody' => 'Their web scraping capabilities are world-class. They handled complex JavaScript-rendered pages with ease and delivered clean, accurate data exactly as specified.',
'reviewBody' => 'Their AI Automation capabilities are world-class. They handled complex JavaScript-rendered pages with ease and delivered clean, accurate data exactly as specified.',
'ratingValue' => 5
]
],

View File

@@ -5,10 +5,10 @@
*
* Usage:
* $serviceData = [
* 'name' => 'Web Scraping Services',
* 'description' => 'Professional web scraping services...',
* 'url' => 'https://ukaiautomation.co.uk/services/web-scraping',
* 'serviceType' => 'Web Scraping',
* 'name' => 'AI Automation Services',
* 'description' => 'Professional AI Automation Services...',
* 'url' => 'https://ukaiautomation.co.uk/services/web-Automation',
* 'serviceType' => 'AI Automation',
* 'priceRange' => '500-50000',
* 'features' => ['Feature 1', 'Feature 2']
* ];
@@ -96,11 +96,11 @@ function generateServiceSchema($serviceName, $serviceDescription, $serviceUrl, $
* Predefined service configurations for consistency
*/
$serviceConfigs = [
'web-scraping' => [
'name' => 'Web Scraping Services UK',
'description' => 'Professional web scraping and data extraction services for UK businesses. Automated data collection from websites with 99.8% accuracy and full GDPR compliance.',
'url' => 'https://ukaiautomation.co.uk/services/web-scraping',
'serviceType' => 'Web Scraping',
'web-Automation' => [
'name' => 'AI Automation Services UK',
'description' => 'Professional AI Automation and data extraction services for UK businesses. Automated data collection from websites with 99.8% accuracy and full GDPR compliance.',
'url' => 'https://ukaiautomation.co.uk/services/web-Automation',
'serviceType' => 'AI Automation',
'priceRange' => '500-50000',
'features' => [
'Automated data extraction',

View File

@@ -5,7 +5,7 @@
*
* Usage:
* include($_SERVER['DOCUMENT_ROOT'] . '/includes/url-config.php');
* echo $urlMap['services']['web-scraping'];
* echo $urlMap['services']['web-Automation'];
*/
$baseUrl = 'https://ukaiautomation.co.uk';
@@ -26,7 +26,7 @@ $urlMap = [
// Services
'services' => [
'index' => '/#services',
'web-scraping' => '/services/web-scraping',
'web-Automation' => '/services/web-Automation',
'competitive-intelligence' => '/services/competitive-intelligence',
'price-monitoring' => '/services/price-monitoring',
'data-cleaning' => '/services/data-cleaning',
@@ -48,7 +48,7 @@ $urlMap = [
// Blog categories
'blog-categories' => [
'web-scraping' => '/blog/categories/web-scraping',
'web-Automation' => '/blog/categories/web-Automation',
'data-analytics' => '/blog/categories/data-analytics',
'business-intelligence' => '/blog/categories/business-intelligence',
'compliance' => '/blog/categories/compliance',
@@ -96,7 +96,7 @@ $serviceData = [
'title' => 'Custom AI Agents',
'shortTitle' => 'AI Agents',
'description' => 'Bespoke AI agents that handle repetitive workflows autonomously',
'icon' => 'icon-web-scraping-v2.svg'
'icon' => 'icon-web-Automation-v2.svg'
],
];
@@ -108,13 +108,13 @@ $locationData = [
'url' => '/locations/london',
'title' => 'London',
'region' => 'Greater London',
'description' => 'Web scraping and data analytics services in London'
'description' => 'AI Automation and data analytics services in London'
],
'manchester' => [
'url' => '/locations/manchester',
'title' => 'Manchester',
'region' => 'Greater Manchester',
'description' => 'Data analytics and web scraping services in Manchester'
'description' => 'Data analytics and AI Automation Services in Manchester'
],
'birmingham' => [
'url' => '/locations/birmingham',
@@ -126,7 +126,7 @@ $locationData = [
'url' => '/locations/edinburgh',
'title' => 'Edinburgh',
'region' => 'Scotland',
'description' => 'Data analytics and web scraping services in Edinburgh'
'description' => 'Data analytics and AI Automation Services in Edinburgh'
],
'cardiff' => [
'url' => '/locations/cardiff',
@@ -140,14 +140,14 @@ $locationData = [
* Related services mapping for cross-linking
*/
$relatedServices = [
'web-scraping' => ['competitive-intelligence', 'price-monitoring', 'data-cleaning'],
'competitive-intelligence' => ['web-scraping', 'price-monitoring', 'data-analytics'],
'price-monitoring' => ['web-scraping', 'competitive-intelligence', 'data-analytics'],
'data-cleaning' => ['web-scraping', 'data-analytics', 'api-development'],
'web-Automation' => ['competitive-intelligence', 'price-monitoring', 'data-cleaning'],
'competitive-intelligence' => ['web-Automation', 'price-monitoring', 'data-analytics'],
'price-monitoring' => ['web-Automation', 'competitive-intelligence', 'data-analytics'],
'data-cleaning' => ['web-Automation', 'data-analytics', 'api-development'],
'data-analytics' => ['competitive-intelligence', 'data-cleaning', 'api-development'],
'api-development' => ['web-scraping', 'data-cleaning', 'data-analytics'],
'property-data-extraction' => ['web-scraping', 'data-cleaning', 'competitive-intelligence'],
'financial-data-services' => ['web-scraping', 'data-analytics', 'api-development']
'api-development' => ['web-Automation', 'data-cleaning', 'data-analytics'],
'property-data-extraction' => ['web-Automation', 'data-cleaning', 'competitive-intelligence'],
'financial-data-services' => ['web-Automation', 'data-analytics', 'api-development']
];
/**