feat: impact-media page type with OG scraping and cache
All checks were successful
Deploy / Deploy to Production (push) Successful in 12s
All checks were successful
Deploy / Deploy to Production (push) Successful in 12s
- Add impact-media blueprint (entries field + linked investigation) - Add minimal impact-media template - Refactor card-open-graph snippet: accepts $url param, Kirby cache (6h TTL), decode HTML entities, empty alt on images - Update impacts.yml to allow impact-media pages - Render impact-media in investigation aside with dynamic count + details/summary - Add OG cache config in config.php - CSS formatting fixes (body, card-block-small, category) Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
This commit is contained in:
parent
b8352c81fa
commit
f757906584
11 changed files with 505 additions and 452 deletions
|
|
@ -1,111 +1,109 @@
|
|||
<?php
|
||||
// URL à scraper (remplacez par l'URL souhaitée)
|
||||
$url = 'https://www.lemonde.fr/societe/article/2025/07/16/au-c-ur-des-emeutes-de-nouvelle-caledonie-quand-la-mort-de-banane-abattu-par-le-gign-lance-le-siege-de-saint-louis_6621496_3224.html';
|
||||
<?php
|
||||
/**
|
||||
* Card Open Graph snippet
|
||||
* Fetches and displays OG data from an external URL with cache.
|
||||
*
|
||||
* @var string $url The URL to scrape OG data from
|
||||
*/
|
||||
|
||||
// Fonction pour récupérer les données Open Graph
|
||||
function getOpenGraphData($url) {
|
||||
$ogData = [
|
||||
'title' => '',
|
||||
'description' => '',
|
||||
'image' => '',
|
||||
'site_name' => '',
|
||||
'url' => $url
|
||||
];
|
||||
if (empty($url)) return;
|
||||
|
||||
// Configuration du contexte pour éviter les erreurs SSL
|
||||
$context = stream_context_create([
|
||||
'http' => [
|
||||
'method' => 'GET',
|
||||
'header' => 'User-Agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36',
|
||||
'timeout' => 10
|
||||
],
|
||||
'ssl' => [
|
||||
'verify_peer' => false,
|
||||
'verify_peer_name' => false
|
||||
]
|
||||
]);
|
||||
$cache = kirby()->cache('og');
|
||||
$cacheKey = md5($url);
|
||||
$ogData = $cache->get($cacheKey);
|
||||
|
||||
// Récupérer le HTML
|
||||
$html = @file_get_contents($url, false, $context);
|
||||
if ($ogData === null) {
|
||||
$ogData = [
|
||||
'title' => '',
|
||||
'description' => '',
|
||||
'image' => '',
|
||||
'site_name' => '',
|
||||
'url' => $url,
|
||||
];
|
||||
|
||||
if ($html === false) {
|
||||
return $ogData;
|
||||
}
|
||||
$context = stream_context_create([
|
||||
'http' => [
|
||||
'method' => 'GET',
|
||||
'header' => 'User-Agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36',
|
||||
'timeout' => 10,
|
||||
],
|
||||
'ssl' => [
|
||||
'verify_peer' => false,
|
||||
'verify_peer_name' => false,
|
||||
],
|
||||
]);
|
||||
|
||||
// Parser les meta tags Open Graph
|
||||
preg_match_all('/<meta\s+property=["\']og:([^"\']+)["\']\s+content=["\']([^"\']+)["\']/i', $html, $matches);
|
||||
$html = @file_get_contents($url, false, $context);
|
||||
|
||||
if (!empty($matches[1])) {
|
||||
foreach ($matches[1] as $index => $property) {
|
||||
$content = $matches[2][$index];
|
||||
switch ($property) {
|
||||
case 'title':
|
||||
$ogData['title'] = htmlspecialchars($content);
|
||||
break;
|
||||
case 'description':
|
||||
$ogData['description'] = htmlspecialchars($content);
|
||||
break;
|
||||
case 'image':
|
||||
$ogData['image'] = $content;
|
||||
break;
|
||||
case 'site_name':
|
||||
$ogData['site_name'] = htmlspecialchars($content);
|
||||
break;
|
||||
}
|
||||
}
|
||||
}
|
||||
if ($html !== false) {
|
||||
// Parse OG meta tags (both property...content and content...property orders)
|
||||
preg_match_all('/<meta\s+(?:property=["\']og:([^"\']+)["\']\s+content=["\']([^"\']*)["\']|content=["\']([^"\']*?)["\']\s+property=["\']og:([^"\']+)["\'])/i', $html, $matches);
|
||||
|
||||
// Fallback: si pas de og:title, utiliser <title>
|
||||
if (empty($ogData['title'])) {
|
||||
preg_match('/<title>([^<]+)<\/title>/i', $html, $titleMatch);
|
||||
if (!empty($titleMatch[1])) {
|
||||
$ogData['title'] = htmlspecialchars($titleMatch[1]);
|
||||
}
|
||||
}
|
||||
if (!empty($matches[1])) {
|
||||
foreach ($matches[1] as $index => $property) {
|
||||
$prop = $property ?: $matches[4][$index];
|
||||
$content = $matches[2][$index] ?: $matches[3][$index];
|
||||
$content = html_entity_decode(trim($content), ENT_QUOTES | ENT_HTML5, 'UTF-8');
|
||||
switch ($prop) {
|
||||
case 'title':
|
||||
$ogData['title'] = $content;
|
||||
break;
|
||||
case 'description':
|
||||
$ogData['description'] = $content;
|
||||
break;
|
||||
case 'image':
|
||||
$ogData['image'] = $content;
|
||||
break;
|
||||
case 'site_name':
|
||||
$ogData['site_name'] = $content;
|
||||
break;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// Fallback: si pas de site_name, utiliser le domaine
|
||||
if (empty($ogData['site_name'])) {
|
||||
$parsed = parse_url($url);
|
||||
$ogData['site_name'] = $parsed['host'] ?? '';
|
||||
}
|
||||
// Fallback: use <title> if no og:title
|
||||
if (empty($ogData['title'])) {
|
||||
preg_match('/<title>([^<]+)<\/title>/i', $html, $titleMatch);
|
||||
if (!empty($titleMatch[1])) {
|
||||
$ogData['title'] = html_entity_decode($titleMatch[1], ENT_QUOTES, 'UTF-8');
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
return $ogData;
|
||||
}
|
||||
// Always use domain as site_name
|
||||
$parsed = parse_url($url);
|
||||
$ogData['site_name'] = $parsed['host'] ?? '';
|
||||
|
||||
$ogData = getOpenGraphData($url);
|
||||
$cache->set($cacheKey, $ogData, 360); // 6 hours
|
||||
}
|
||||
?>
|
||||
|
||||
// Toujours utiliser le domaine de l'URL pour site_name
|
||||
$parsed = parse_url($url);
|
||||
$ogData['site_name'] = $parsed['host'] ?? '';
|
||||
?>
|
||||
<div class="card--open-graph">
|
||||
<div class="open-graph__inner">
|
||||
|
||||
<div class="card--open-graph">
|
||||
<div class="open-graph__inner">
|
||||
<?php if (!empty($ogData['image'])): ?>
|
||||
<figure>
|
||||
<img src="<?= htmlspecialchars($ogData['image']) ?>" alt="">
|
||||
</figure>
|
||||
<?php endif ?>
|
||||
|
||||
<?php if (!empty($ogData['image'])): ?>
|
||||
<figure>
|
||||
<img src="<?= $ogData['image'] ?>" alt="<?= $ogData['title'] ?>">
|
||||
</figure>
|
||||
<?php endif; ?>
|
||||
<div class="content">
|
||||
<?php if (!empty($ogData['site_name'])): ?>
|
||||
<span class="site-name"><?= htmlspecialchars($ogData['site_name']) ?></span>
|
||||
<?php endif ?>
|
||||
|
||||
<div class="content">
|
||||
<?php if (!empty($ogData['site_name'])): ?>
|
||||
<span class="site-name"><?= $ogData['site_name'] ?></span>
|
||||
<?php endif; ?>
|
||||
<?php if (!empty($ogData['title'])): ?>
|
||||
<h3 class="title">
|
||||
<a href="<?= htmlspecialchars($ogData['url']) ?>" target="_blank">
|
||||
<?= htmlspecialchars($ogData['title']) ?>
|
||||
</a>
|
||||
</h3>
|
||||
<?php endif ?>
|
||||
|
||||
<?php if (!empty($ogData['title'])): ?>
|
||||
|
||||
<h3 class="title">
|
||||
<a href="<?= $ogData['url'] ?>" target="_blank">
|
||||
<?= $ogData['title'] ?>
|
||||
</a>
|
||||
</h3>
|
||||
<?php endif; ?>
|
||||
|
||||
<?php if (!empty($ogData['description'])): ?>
|
||||
<p class="description"><?= $ogData['description'] ?></p>
|
||||
<?php endif; ?>
|
||||
</div>
|
||||
<a class="link-block" href="<?= $ogData['url'] ?>" target="_blank"></a>
|
||||
</div>
|
||||
</div>
|
||||
<?php if (!empty($ogData['description'])): ?>
|
||||
<p class="description"><?= htmlspecialchars($ogData['description']) ?></p>
|
||||
<?php endif ?>
|
||||
</div>
|
||||
<a class="link-block" href="<?= htmlspecialchars($ogData['url']) ?>" target="_blank"></a>
|
||||
</div>
|
||||
</div>
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue