Subversion Repositories SvarDOS

Rev

Rev 920 | Rev 922 | Go to most recent revision | Details | Compare with Previous | Last modification | View Log | RSS feed

Rev Author Line No. Line
562 mateuszvis 1
<?php /*
2
 
3
  SvarDOS repo index builder
4
  Copyright (C) Mateusz Viste 2012-2022
5
 
734 bttr 6
  buildidx computes an index json file for the SvarDOS repository.
673 mateusz.vi 7
  it must be executed pointing to a directory that stores packages (*.svp)
562 mateuszvis 8
  files. buildidx will generate the index file and save it into the package
9
  repository.
10
 
11
  requires php-zip
12
 
912 mateusz.vi 13
  21 feb 2022: buildidx collects categories looking at the dir layout of each package + improved version string parsing (replaced version_compare call by dos_version_compare)
775 mateusz.vi 14
  17 feb 2022: checking for non-8+3 filenames in packages and duplicates + devload no longer part of CORE
736 mateusz.vi 15
  16 feb 2022: added warning about overlong version strings and wild files location
719 mateusz.vi 16
  15 feb 2022: index is generated as json, contains all filenames and alt versions
673 mateusz.vi 17
  14 feb 2022: packages are expected to have the *.svp extension
650 mateusz.vi 18
  12 feb 2022: skip source packages from being processed (*.src.zip)
562 mateuszvis 19
  20 jan 2022: rewritten the code from ANSI C to PHP for easier maintenance
20
  13 feb 2021: 'title' LSM field is no longer looked after
21
  11 feb 2021: lsm headers are no longer checked, so it is compatible with the simpler lsm format used by SvarDOS
22
  13 jan 2021: removed the identification line, changed CRC32 to bsum, not creating the listing.txt file and stopped compressing index
23
  23 apr 2017: uncompressed index is no longer created, added CRC32 of zib (bin only) files, if present
24
  28 aug 2016: listing.txt is always written inside the repo dir (instead of inside current dir)
25
  27 aug 2016: accepting full paths to repos (starting with /...)
26
  07 dec 2013: rewritten buildidx in ANSI C89
27
  19 aug 2013: add a compressed version of the index file to repos (index.gz)
28
  22 jul 2013: creating a listing.txt file with list of packages
29
  18 jul 2013: writing the number of packaged into the first line of the lst file
30
  11 jul 2013: added a switch to 7za to make it case insensitive when extracting lsm files
31
  10 jul 2013: changed unzip calls to 7za (to handle cases when appinfo is compressed with lzma)
32
  04 feb 2013: added CRC32 support
33
  22 sep 2012: forked 1st version from FDUPDATE builder
34
*/
35
 
921 mateusz.vi 36
$PVER = "20220222";
562 mateuszvis 37
 
38
 
39
// computes the BSD sum of a file and returns it
40
function file2bsum($fname) {
41
  $result = 0;
42
 
43
  $fd = fopen($fname, 'rb');
44
  if ($fd === false) return(0);
45
 
46
  while (!feof($fd)) {
47
 
48
    $buff = fread($fd, 1024 * 1024);
49
 
563 mateuszvis 50
    $slen = strlen($buff);
51
    for ($i = 0; $i < $slen; $i++) {
562 mateuszvis 52
      // rotr
53
      $result = ($result >> 1) | ($result << 15);
54
      // add and truncate to 16 bits
563 mateuszvis 55
      $result += ord($buff[$i]);
562 mateuszvis 56
      $result &= 0xffff;
57
    }
58
  }
59
 
60
  fclose($fd);
61
  return($result);
62
}
63
 
64
 
912 mateusz.vi 65
// translates a version string into a array of integer values.
66
// Accepted formats follow:
67
//    300.12.1
68
//    1
69
//    12.2.34.2-4.5
70
//    1.2c
71
//    1.01 beta+3
72
//    2013-12-31
73
//    20220222 alpha
74
function vertoarr($verstr) {
75
  $subver = array(0,0,0,0);
76
 
77
  // switch string to lcase for easier processing and trim any leading or trailing white spaces
78
  $verstr = strtolower(trim($verstr));
79
 
80
  // replace all '-' and '/' characters to '.' (uniformization of sub-version parts delimiters)
81
  $verstr = strtr($verstr, '-/', '..');
82
 
83
  // is there a subversion value? (for example "+4" in "1.05+4")
84
  $i = strrpos($verstr, '+', 1);
85
  if ($i !== false) {
86
    // validate the svar-version is a proper integer
87
    $svarver = substr($verstr, $i + 1);
88
    if (! preg_match('/[1-9][0-9]*/', $svarver)) {
89
      return(false);
90
    }
91
    $subver[3] = intval($svarver); // set the +rev as a very minor item
92
    $verstr = substr($verstr, 0, $i);
93
  }
94
 
921 mateusz.vi 95
  // is the version ending with ' alpha', 'beta', etc?
96
  if (preg_match('/ (alpha|beta|gamma|delta|pre|rc)( [0-9]{1,4}){0,1}$/', $verstr)) {
97
    // if there is a trailing beta-number, process it first
98
    if (preg_match('/ [0-9]{1,4}$/', $verstr)) {
99
      $i = strrpos($verstr, ' ');
100
      $subver[2] = intval(substr($verstr, $i + 1));
101
      $verstr = trim(substr($verstr, 0, $i));
102
    }
912 mateusz.vi 103
    $i = strrpos($verstr, ' ');
104
    $greek = substr($verstr, $i + 1);
105
    $verstr = trim(substr($verstr, 0, $i));
106
    if ($greek == 'alpha') {
921 mateusz.vi 107
      $subver[1] = 1;
912 mateusz.vi 108
    } else if ($greek == 'beta') {
921 mateusz.vi 109
      $subver[1] = 2;
920 mateusz.vi 110
    } else if ($greek == 'gamma') {
921 mateusz.vi 111
      $subver[1] = 3;
920 mateusz.vi 112
    } else if ($greek == 'delta') {
921 mateusz.vi 113
      $subver[1] = 4;
114
    } else if ($greek == 'pre') {
115
      $subver[1] = 5;
914 mateusz.vi 116
    } else if ($greek == 'rc') {
921 mateusz.vi 117
      $subver[1] = 6;
912 mateusz.vi 118
    } else {
119
      return(false);
120
    }
914 mateusz.vi 121
  } else {
921 mateusz.vi 122
    $subver[1] = 99;
912 mateusz.vi 123
  }
124
 
125
  // does the version string have a single-letter subversion? (1.0c)
126
  if (preg_match('/[a-z]$/', $verstr)) {
921 mateusz.vi 127
    $subver[0] = ord(substr($verstr, -1));
912 mateusz.vi 128
    $verstr = substr_replace($verstr, '', -1); // remove last character from string
129
  }
130
 
131
  // validate the format is supported, should be something no more complex than 1.05.3.33
919 mateusz.vi 132
  if (! preg_match('/^[0-9][0-9.]{0,20}$/', $verstr)) {
912 mateusz.vi 133
    return(false);
134
  }
135
 
136
  // NOTE: a zero right after a separator and trailed with a digit (as in 1.01)
137
  //       has a special meaning
138
  $exploded = explode('.', $verstr);
139
  if (count($exploded) > 16) {
140
    return(false);
141
  }
921 mateusz.vi 142
  $exploded[16] = $subver[0]; // a-z (1.0c)
143
  $exploded[17] = $subver[1]; // alpha/beta/gamma/delta/rc/pre
144
  $exploded[18] = $subver[2]; // alpha-beta-gamma subversion (eg. "beta 9")
912 mateusz.vi 145
  $exploded[19] = $subver[3]; // svar-ver (1.0+5)
146
  for ($i = 0; $i < 20; $i++) if (empty($exploded[$i])) $exploded[$i] = '0';
147
 
148
  ksort($exploded);
149
 
150
  return($exploded);
151
}
152
 
153
 
154
function dos_version_compare($v1, $v2) {
155
  $v1arr = vertoarr($v1);
156
  $v2arr = vertoarr($v2);
157
  for ($i = 0; $i < count($v1arr); $i++) {
921 mateusz.vi 158
    if ($v1arr[$i] > $v2arr[$i]) return(1);
159
    if ($v1arr[$i] < $v2arr[$i]) return(-1);
912 mateusz.vi 160
  }
161
  return(0);
162
}
163
 
164
 
562 mateuszvis 165
// reads file fil from zip archive z and returns its content, or false on error
166
function read_file_from_zip($z, $fil) {
167
  $zip = new ZipArchive;
168
  if ($zip->open($z, ZipArchive::RDONLY) !== true) {
169
    echo "ERROR: failed to open zip file '{$z}'\n";
170
    return(false);
171
  }
172
 
173
  // load the appinfo/pkgname.lsm file
174
  $res = $zip->getFromName($fil, 8192, ZipArchive::FL_NOCASE);
175
 
176
  $zip->close();
177
  return($res);
178
}
179
 
180
 
731 mateusz.vi 181
function read_list_of_files_in_zip($z) {
182
  $zip = new ZipArchive;
183
  if ($zip->open($z, ZipArchive::RDONLY) !== true) {
184
    echo "ERROR: failed to open zip file '{$z}'\n";
185
    return(false);
186
  }
187
 
188
  $res = array();
189
  for ($i = 0; $i < $zip->numFiles; $i++) $res[] = $zip->getNameIndex($i);
190
 
191
  $zip->close();
192
  return($res);
193
}
194
 
195
 
562 mateuszvis 196
// reads a LSM string and returns it in the form of an array
197
function parse_lsm($s) {
198
  $res = array();
199
  for ($l = strtok($s, "\n"); $l !== false; $l = strtok("\n")) {
200
    // the line is "token: value", let's find the colon
201
    $colpos = strpos($l, ':');
202
    if (($colpos === false) || ($colpos === 0)) continue;
203
    $tok = strtolower(trim(substr($l, 0, $colpos)));
204
    $val = trim(substr($l, $colpos + 1));
205
    $res[$tok] = $val;
206
  }
207
  return($res);
208
}
209
 
210
 
731 mateusz.vi 211
// on PHP 8+ there is str_starts_with(), but not on PHP 7 so I use this
212
function str_head_is($haystack, $needle) {
213
  return strpos($haystack, $needle) === 0;
214
}
215
 
216
 
791 mateusz.vi 217
// returns an array that contains CORE packages (populated from the core subdirectory in pkgdir)
218
function load_core_list($repodir) {
219
  $res = array();
220
 
221
  foreach (scandir($repodir . '/core/') as $f) {
222
    if (!preg_match('/\.svp$/', $f)) continue;
223
    $res[] = explode('.', $f)[0];
224
  }
225
  return($res);
226
}
227
 
228
 
562 mateuszvis 229
// ***************** MAIN ROUTINE *********************************************
230
 
719 mateusz.vi 231
//echo "SvarDOS repository index generator ver {$PVER}\n";
562 mateuszvis 232
 
233
if (($_SERVER['argc'] != 2) || ($_SERVER['argv'][1][0] == '-')) {
234
  echo "usage: php buildidx.php repodir\n";
235
  exit(1);
236
}
237
 
238
$repodir = $_SERVER['argv'][1];
239
 
240
$pkgfiles = scandir($repodir);
241
$pkgcount = 0;
242
 
738 mateusz.vi 243
 
795 mateusz.vi 244
// load the list of CORE and MSDOS_COMPAT packages
738 mateusz.vi 245
 
791 mateusz.vi 246
$core_packages_list = load_core_list($repodir);
804 bttr 247
$msdos_compat_list = explode(' ', 'append assign attrib chkdsk choice command comp cpidos debug defrag deltree diskcomp diskcopy display edit edlin exe2bin fc fdapm fdisk find format help himemx kernel keyb label localcfg mem mirror mode more move nlsfunc print replace share shsucdx sort swsubst tree undelete unformat xcopy');
738 mateusz.vi 248
 
719 mateusz.vi 249
// do a list of all svp packages with their available versions and descriptions
562 mateuszvis 250
 
719 mateusz.vi 251
$pkgdb = array();
252
foreach ($pkgfiles as $fname) {
801 mateusz.vi 253
  if (!preg_match('/\.svp$/i', $fname)) continue; // skip non-svp files
562 mateuszvis 254
 
801 mateusz.vi 255
  if (!preg_match('/^[a-zA-Z0-9+. _-]*\.svp$/', $fname)) {
256
    echo "ERROR: {$fname} has a very weird name\n";
257
    continue;
258
  }
259
 
719 mateusz.vi 260
  $path_parts = pathinfo($fname);
261
  $pkgnam = explode('-', $path_parts['filename'])[0];
262
  $pkgfullpath = realpath($repodir . '/' . $fname);
562 mateuszvis 263
 
719 mateusz.vi 264
  $lsm = read_file_from_zip($pkgfullpath, "appinfo/{$pkgnam}.lsm");
562 mateuszvis 265
  if ($lsm == false) {
802 mateusz.vi 266
    echo "ERROR: {$fname} does not contain an LSM file at the expected location\n";
719 mateusz.vi 267
    continue;
562 mateuszvis 268
  }
269
  $lsmarray = parse_lsm($lsm);
270
  if (empty($lsmarray['version'])) {
719 mateusz.vi 271
    echo "ERROR: lsm file in {$fname} does not contain a version\n";
272
    continue;
562 mateuszvis 273
  }
730 mateusz.vi 274
  if (strlen($lsmarray['version']) > 16) {
737 mateusz.vi 275
    echo "ERROR: version string in lsm file of {$fname} is too long (16 chars max)\n";
730 mateusz.vi 276
    continue;
277
  }
562 mateuszvis 278
  if (empty($lsmarray['description'])) {
719 mateusz.vi 279
    echo "ERROR: lsm file in {$fname} does not contain a description\n";
280
    continue;
562 mateuszvis 281
  }
282
 
731 mateusz.vi 283
  // validate the files present in the archive
284
  $listoffiles = read_list_of_files_in_zip($pkgfullpath);
739 mateusz.vi 285
  $pkgdir = $pkgnam;
286
 
768 mateusz.vi 287
  // special rule for "parent and children" packages
288
  if (str_head_is($pkgnam, 'djgpp_')) $pkgdir = 'djgpp'; // djgpp_* packages put their files in djgpp
754 mateusz.vi 289
  if ($pkgnam == 'fbc_help') $pkgdir = 'fbc'; // FreeBASIC help goes to the FreeBASIC dir
802 mateusz.vi 290
  if ($pkgnam == 'clamdb') $pkgdir = 'clamav'; // data patterns for clamav
739 mateusz.vi 291
 
768 mateusz.vi 292
  // array used to detect duplicated entries after lower-case conversion
293
  $duparr = array();
294
 
909 mateusz.vi 295
  // will hold the list of categories that this package belongs to
296
  $catlist = array();
297
 
731 mateusz.vi 298
  foreach ($listoffiles as $f) {
299
    $f = strtolower($f);
768 mateusz.vi 300
    $path_array = explode('/', $f);
301
    // emit a warning when non-8+3 filenames are spotted and find duplicates
302
    foreach ($path_array as $item) {
303
      if (empty($item)) continue; // skip empty items at end of paths (eg. appinfo/)
304
      if (!preg_match("/[a-z0-9!#$%&'()@^_`{}~-]{1,8}(\.[a-z0-9!#$%&'()@^_`{}~-]{1,3}){0,1}/", $item)) {
305
        echo "WARNING: {$fname} contains a non-8+3 path (or weird char): {$item} (in $f)\n";
306
      }
307
    }
308
    // look for dups
309
    if (array_search($f, $duparr) !== false) {
310
      echo "WARNING: {$fname} contains a duplicated entry: '{$f}'\n";
311
    } else {
312
      $duparr[] = $f;
313
    }
731 mateusz.vi 314
    // LSM file is ok
315
    if ($f === "appinfo/{$pkgnam}.lsm") continue;
316
    if ($f === "appinfo/") continue;
795 mateusz.vi 317
    // CORE and MSDOS_COMPAT packages are premium citizens and can do a little more
909 mateusz.vi 318
    $core_or_msdoscompat = 0;
319
    if (array_search($pkgnam, $core_packages_list) !== false) {
320
      $catlist[] = 'core';
321
      $core_or_msdoscompat = 1;
322
    }
323
    if (array_search($pkgnam, $msdos_compat_list) !== false) {
324
      $catlist[] = 'msdos_compat';
325
      $core_or_msdoscompat = 1;
326
    }
327
    if ($core_or_msdoscompat == 1) {
736 mateusz.vi 328
      if (str_head_is($f, 'bin/')) continue;
779 mateusz.vi 329
      if (str_head_is($f, 'cpi/')) continue;
749 mateusz.vi 330
      if (str_head_is($f, "doc/{$pkgdir}/")) continue;
331
      if ($f === 'doc/') continue;
332
      if (str_head_is($f, "nls/{$pkgdir}.")) continue;
333
      if ($f === 'nls/') continue;
736 mateusz.vi 334
    }
798 mateusz.vi 335
    // the help package is allowed to put files in... help
336
    if (($pkgnam == 'help') && (str_head_is($f, 'help/'))) continue;
909 mateusz.vi 337
    // must be category-prefixed file, add it to the list of categories for this package
338
    $catlist[] = explode('/', $f)[0];
749 mateusz.vi 339
    // well-known "category" dirs are okay
739 mateusz.vi 340
    if (str_head_is($f, "progs/{$pkgdir}/")) continue;
731 mateusz.vi 341
    if ($f === 'progs/') continue;
739 mateusz.vi 342
    if (str_head_is($f, "devel/{$pkgdir}/")) continue;
731 mateusz.vi 343
    if ($f === 'devel/') continue;
739 mateusz.vi 344
    if (str_head_is($f, "games/{$pkgdir}/")) continue;
731 mateusz.vi 345
    if ($f === 'games/') continue;
739 mateusz.vi 346
    if (str_head_is($f, "drivers/{$pkgdir}/")) continue;
731 mateusz.vi 347
    if ($f === 'drivers/') continue;
768 mateusz.vi 348
    echo "WARNING: {$fname} contains a file in an illegal location: {$f}\n";
731 mateusz.vi 349
  }
350
 
912 mateusz.vi 351
  // do I understand the version string?
352
  if (vertoarr($lsmarray['version']) === false) echo "WARNING: {$fname} parsing of version string failed ('{$lsmarray['version']}')\n";
353
 
719 mateusz.vi 354
  $meta['fname'] = $fname;
355
  $meta['desc'] = $lsmarray['description'];
909 mateusz.vi 356
  $meta['cats'] = array_unique($catlist);
719 mateusz.vi 357
 
358
  $pkgdb[$pkgnam][$lsmarray['version']] = $meta;
359
}
360
 
801 mateusz.vi 361
 
719 mateusz.vi 362
$db = array();
909 mateusz.vi 363
$cats = array();
719 mateusz.vi 364
 
909 mateusz.vi 365
// ******** compute the version-sorted list of packages with a single *********
366
// ******** description and category list for each package ********************
367
 
719 mateusz.vi 368
// iterate over each svp package
369
foreach ($pkgdb as $pkg => $versions) {
370
 
371
  // sort filenames by version, highest first
912 mateusz.vi 372
  uksort($versions, "dos_version_compare");
719 mateusz.vi 373
  $versions = array_reverse($versions, true);
374
 
375
  foreach ($versions as $ver => $meta) {
376
    $fname = $meta['fname'];
377
    $desc = $meta['desc'];
378
 
379
    $bsum = file2bsum(realpath($repodir . '/' . $fname));
380
 
381
    $meta2['ver'] = strval($ver);
382
    $meta2['bsum'] = $bsum;
383
 
384
    if (empty($db[$pkg]['desc'])) $db[$pkg]['desc'] = $desc;
909 mateusz.vi 385
    if (empty($db[$pkg]['cats'])) {
386
      $db[$pkg]['cats'] = $meta['cats'];
387
      $cats = array_unique(array_merge($cats, $meta['cats']));
388
    }
719 mateusz.vi 389
    $db[$pkg]['versions'][$fname] = $meta2;
390
  }
391
 
562 mateuszvis 392
  $pkgcount++;
393
 
394
}
395
 
719 mateusz.vi 396
if ($pkgcount < 100) echo "WARNING: an unexpectedly low number of packages has been found in the repo ({$pkgcount})\n";
562 mateuszvis 397
 
801 mateusz.vi 398
$json_blob = json_encode($db);
399
if ($json_blob === false) {
400
  echo "ERROR: JSON convertion failed! -> ";
401
  switch (json_last_error()) {
402
    case JSON_ERROR_DEPTH:
403
      echo 'maximum stack depth exceeded';
404
      break;
405
    case JSON_ERROR_STATE_MISMATCH:
406
      echo 'underflow of the modes mismatch';
407
      break;
408
    case JSON_ERROR_CTRL_CHAR:
409
      echo 'unexpected control character found';
410
      break;
411
    case JSON_ERROR_UTF8:
412
      echo 'malformed utf-8 characters';
413
      break;
414
    default:
415
      echo "unknown error";
416
      break;
417
  }
418
  echo "\n";
419
}
420
 
909 mateusz.vi 421
file_put_contents($repodir . '/_index.json', $json_blob);
562 mateuszvis 422
 
909 mateusz.vi 423
$cats_json = json_encode($cats);
424
file_put_contents($repodir . '/_cats.json', $cats_json);
425
 
562 mateuszvis 426
exit(0);
427
 
428
?>