File: generate_parser_corpus.php

package info (click to toggle)
php8.4 8.4.11-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 208,108 kB
  • sloc: ansic: 1,060,628; php: 35,345; sh: 11,866; cpp: 7,201; pascal: 4,913; javascript: 3,091; asm: 2,810; yacc: 2,411; makefile: 689; xml: 446; python: 301; awk: 148
file content (24 lines) | stat: -rw-r--r-- 716 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
<?php

// Builds the parser corpus: for every .phpt test below Zend/tests, the body of
// its --FILE-- section is extracted and written as one flat file into
// corpus/parser (next to this script). Sections larger than $maxLen bytes are
// skipped.

$testsDir = __DIR__ . '/../../Zend/tests/';
$it = new RecursiveIteratorIterator(
    new RecursiveDirectoryIterator($testsDir),
    RecursiveIteratorIterator::LEAVES_ONLY
);

$corpusDir = __DIR__ . '/corpus/parser';
// Create the directory recursively: the parent "corpus" directory may not exist
// yet. The trailing is_dir() re-check tolerates a concurrent creation.
if (!is_dir($corpusDir) && !mkdir($corpusDir, 0777, true) && !is_dir($corpusDir)) {
    fwrite(STDERR, "Unable to create corpus directory: $corpusDir\n");
    exit(1);
}

// Upper bound (in bytes) on the size of a single corpus entry.
$maxLen = 6 * 1024;
foreach ($it as $file) {
    // The iterator yields SplFileInfo objects; work on the plain path string.
    $path = $file->getPathname();
    if (!preg_match('/\.phpt$/', $path)) continue;

    $contents = file_get_contents($path);
    if ($contents === false) continue;

    // Capture everything between the --FILE-- marker and the next --SECTION--
    // marker; tests without such a pair are skipped.
    if (!preg_match('/--FILE--\R(.*?)\R--(?:[_A-Z]+)--/s', $contents, $matches)) continue;
    $code = $matches[1];
    if (strlen($code) > $maxLen) continue;

    // Flatten the path relative to the tests directory into a single file name.
    // Both '/' and the platform separator are replaced, because the iterator
    // joins sub-paths with DIRECTORY_SEPARATOR.
    $outFile = str_replace($testsDir, '', $path);
    $outFile = str_replace(['/', DIRECTORY_SEPARATOR], '_', $outFile);
    $outFile = $corpusDir . '/' . $outFile;
    if (file_put_contents($outFile, $code) === false) {
        fwrite(STDERR, "Unable to write corpus file: $outFile\n");
    }
}