respect-validation/src-dev/Commands/UpdateDomainToplevelCommand.php
Henrique Moody 7892a7c902
Port Bash scripts to PHP
It makes more sense to use PHP to generate PHP code than to use Bash. I
love writing Bash scripts, but I know it's not for everyone, and they
can become quite complex. Porting them to PHP code also lowers the
barrier for people to change them.

While I was making those changes, I also noticed a problem with how we
save the domain suffixes. We're converting all of them to ASCII, so we
are not preserving languages such as Chinese, Thai, and Hebrew, which
use non-ASCII characters.
2026-01-06 10:06:22 +01:00

95 lines
2.7 KiB
PHP

<?php
/*
* Copyright (c) Alexandre Gomes Gaigalas <alganet@gmail.com>
* SPDX-License-Identifier: MIT
*/
declare(strict_types=1);
namespace Respect\Dev\Commands;
use Symfony\Component\Console\Attribute\AsCommand;
use Symfony\Component\Console\Command\Command;
use Symfony\Component\Console\Input\InputInterface;
use Symfony\Component\Console\Output\OutputInterface;
use Symfony\Component\Console\Style\SymfonyStyle;
use Symfony\Component\VarExporter\VarExporter;
use function basename;
use function count;
use function dirname;
use function explode;
use function file_get_contents;
use function file_put_contents;
use function implode;
use function sprintf;
use function str_starts_with;
use function trim;
use const PHP_EOL;
#[AsCommand(
name: 'update:domain-toplevel',
description: 'Update list of Top Level Domains (TLD) in the Tld validator',
)]
final class UpdateDomainToplevelCommand extends Command
{
private const string LIST_URL = 'https://data.iana.org/TLD/tlds-alpha-by-domain.txt';
protected function execute(InputInterface $input, OutputInterface $output): int
{
$io = new SymfonyStyle($input, $output);
$io->title('Updating TLD list');
// Download the list
$io->section('Downloading list');
$io->text(sprintf('Fetching from: %s', self::LIST_URL));
$listContent = file_get_contents(self::LIST_URL);
if ($listContent === false) {
$io->error('Failed to download TLD list');
return Command::FAILURE;
}
$io->success('Downloaded successfully');
// Process the list
$io->section('Processing TLD list');
$lines = explode("\n", trim($listContent));
$tlds = [];
foreach ($lines as $line) {
$line = trim($line);
if ($line === '' || str_starts_with($line, '#')) {
continue;
}
$tlds[] = $line;
}
// Create the data file
$dataFilename = dirname(__DIR__, 2) . '/data/domain/tld.php';
$fileContent = implode(PHP_EOL, [
'<?php declare(strict_types=1);',
'// Copyright (c) https://data.iana.org/TLD/',
'// SPDX-License-Identifier: MPL-2.0',
'return ' . VarExporter::export($tlds) . ';' . PHP_EOL,
]);
// Write the data file
if (file_put_contents($dataFilename, $fileContent) === false) {
$io->error('Failed to write data file');
return Command::FAILURE;
}
$io->success(sprintf('Updated %s successfully', basename($dataFilename)));
$io->text(sprintf('Total TLDs: %d', count($tlds)));
return Command::SUCCESS;
}
}