研学线路

master
lion 2 days ago
parent 228413f7f1
commit 96f023f609

@@ -497,6 +497,14 @@ class DocTextExtractor
return false;
}
if (preg_match('/^[\d\s]+人$/u', $line)) {
return false;
}
if (preg_match('/^[\d\-\—-–\s]+$/u', $line) && preg_match('/\d{3,}/', $line)) {
return false;
}
if (preg_match('/[\x{0080}-\x{009F}]/u', $line)) {
return true;
}

@@ -517,21 +517,6 @@ class StudyTourDeclarationParser
];
}
foreach ($groups as &$group) {
$lastLocation = '';
foreach ($group['items'] as &$item) {
if ($item['location'] !== '') {
$lastLocation = $item['location'];
continue;
}
if ($lastLocation !== '') {
$item['location'] = $lastLocation;
}
}
unset($item);
}
unset($group);
return StudyTourPayload::normalizeRoutePlans($groups);
}
@@ -897,6 +882,14 @@ class StudyTourDeclarationParser
return false;
}
if (preg_match('/^[\d\s]+人$/u', $line)) {
return false;
}
if (preg_match('/^[\d\-\—-–\s]+$/u', $line) && preg_match('/\d{3,}/', $line)) {
return false;
}
if (self::isWordMetadataLine($line)) {
return true;
}

@@ -250,6 +250,7 @@ class StudyTourPayload
public static function normalizeContactPhones(string $raw): string
{
$raw = str_replace(['—', '', ''], '-', $raw);
$raw = str_replace([',', '', ';', '', '/', '|'], '、', $raw);
$parts = preg_split('/[、\s]+/u', $raw) ?: [];
$parts = array_values(array_filter(array_map('trim', $parts), fn ($p) => $p !== ''));

Loading…
Cancel
Save