Subversion Repositories SvarDOS

Rev

Rev 941 | Rev 951 | Go to most recent revision | Only display areas with differences | Ignore whitespace | Details | Blame | Last modification | View Log | RSS feed

Rev 941 Rev 946
1
<?php /*
1
<?php /*
2
 
2
 
3
  SvarDOS repo index builder
3
  SvarDOS repo index builder
4
  Copyright (C) Mateusz Viste 2012-2022
4
  Copyright (C) Mateusz Viste 2012-2022
5
 
5
 
6
  buildidx computes an index json file for the SvarDOS repository.
6
  buildidx computes an index json file for the SvarDOS repository.
7
  it must be executed pointing to a directory that stores packages (*.svp)
7
  it must be executed pointing to a directory that stores packages (*.svp)
8
  files. buildidx will generate the index file and save it into the package
8
  files. buildidx will generate the index file and save it into the package
9
  repository.
9
  repository.
10
 
10
 
11
  requires php-zip
11
  requires php-zip
12
 
12
 
13
  23 feb 2022: basic validation of source archives (not empty + matches an existing svp file)
13
  23 feb 2022: basic validation of source archives (not empty + matches an existing svp file)
14
  21 feb 2022: buildidx collects categories looking at the dir layout of each package + improved version string parsing (replaced version_compare call by dos_version_compare)
14
  21 feb 2022: buildidx collects categories looking at the dir layout of each package + improved version string parsing (replaced version_compare call by dos_version_compare)
15
  17 feb 2022: checking for non-8+3 filenames in packages and duplicates + devload no longer part of CORE
15
  17 feb 2022: checking for non-8+3 filenames in packages and duplicates + devload no longer part of CORE
16
  16 feb 2022: added warning about overlong version strings and wild files location
16
  16 feb 2022: added warning about overlong version strings and wild files location
17
  15 feb 2022: index is generated as json, contains all filenames and alt versions
17
  15 feb 2022: index is generated as json, contains all filenames and alt versions
18
  14 feb 2022: packages are expected to have the *.svp extension
18
  14 feb 2022: packages are expected to have the *.svp extension
19
  12 feb 2022: skip source packages from being processed (*.src.zip)
19
  12 feb 2022: skip source packages from being processed (*.src.zip)
20
  20 jan 2022: rewritten the code from ANSI C to PHP for easier maintenance
20
  20 jan 2022: rewritten the code from ANSI C to PHP for easier maintenance
21
  13 feb 2021: 'title' LSM field is no longer looked after
21
  13 feb 2021: 'title' LSM field is no longer looked after
22
  11 feb 2021: lsm headers are no longer checked, so it is compatible with the simpler lsm format used by SvarDOS
22
  11 feb 2021: lsm headers are no longer checked, so it is compatible with the simpler lsm format used by SvarDOS
23
  13 jan 2021: removed the identification line, changed CRC32 to bsum, not creating the listing.txt file and stopped compressing index
23
  13 jan 2021: removed the identification line, changed CRC32 to bsum, not creating the listing.txt file and stopped compressing index
24
  23 apr 2017: uncompressed index is no longer created, added CRC32 of zib (bin only) files, if present
24
  23 apr 2017: uncompressed index is no longer created, added CRC32 of zib (bin only) files, if present
25
  28 aug 2016: listing.txt is always written inside the repo dir (instead of inside current dir)
25
  28 aug 2016: listing.txt is always written inside the repo dir (instead of inside current dir)
26
  27 aug 2016: accepting full paths to repos (starting with /...)
26
  27 aug 2016: accepting full paths to repos (starting with /...)
27
  07 dec 2013: rewritten buildidx in ANSI C89
27
  07 dec 2013: rewritten buildidx in ANSI C89
28
  19 aug 2013: add a compressed version of the index file to repos (index.gz)
28
  19 aug 2013: add a compressed version of the index file to repos (index.gz)
29
  22 jul 2013: creating a listing.txt file with list of packages
29
  22 jul 2013: creating a listing.txt file with list of packages
30
  18 jul 2013: writing the number of packages into the first line of the lst file
30
  18 jul 2013: writing the number of packages into the first line of the lst file
31
  11 jul 2013: added a switch to 7za to make it case insensitive when extracting lsm files
31
  11 jul 2013: added a switch to 7za to make it case insensitive when extracting lsm files
32
  10 jul 2013: changed unzip calls to 7za (to handle cases when appinfo is compressed with lzma)
32
  10 jul 2013: changed unzip calls to 7za (to handle cases when appinfo is compressed with lzma)
33
  04 feb 2013: added CRC32 support
33
  04 feb 2013: added CRC32 support
34
  22 sep 2012: forked 1st version from FDUPDATE builder
34
  22 sep 2012: forked 1st version from FDUPDATE builder
35
*/
35
*/
36
 
36
 
37
$PVER = "20220223";
37
$PVER = "20220223";
38
 
38
 
39
 
39
 
40
// computes the 16-bit BSD checksum of a file and returns it.
//
// The file is read in chunks of 1 MiB; for every byte the running sum is
// rotated right by one bit (within 16 bits), the byte value is added and the
// result is truncated to 16 bits.
//
// $fname: path of the file to checksum
// returns an integer in the range 0..65535. 0 is also returned when the file
// cannot be opened, so a zero result does not prove that the file was read.
function file2bsum($fname) {
  $result = 0;

  $fd = fopen($fname, 'rb');
  if ($fd === false) return(0);

  while (!feof($fd)) {

    $buff = fread($fd, 1024 * 1024);

    // a failed read never raises the EOF flag, so without this guard the
    // loop would spin forever; an empty read means there is nothing left
    if (($buff === false) || ($buff === '')) break;

    $slen = strlen($buff);
    for ($i = 0; $i < $slen; $i++) {
      // rotr (16-bit wide)
      $result = (($result >> 1) | ($result << 15)) & 0xffff;
      // add and truncate to 16 bits
      $result = ($result + ord($buff[$i])) & 0xffff;
    }
  }

  fclose($fd);
  return($result);
}
64
 
64
 
65
 
65
 
66
// translates a version string into an array of 20 comparable values.
// Accepted formats follow:
//    300.12.1
//    1
//    12.2.34.2-4.5
//    1.2c
//    1.01 beta+3
//    2013-12-31
//    20220222 alpha
//
// Layout of the returned array (keys 0..19, sorted by key):
//    0..15  the dot-separated numeric parts of the version, kept as the
//           strings found in the input (missing or empty parts become '0')
//    16     ordinal of a trailing single-letter sub-version (1.0c), else '0'
//    17     release stage: alpha=1 beta=2 gamma=3 delta=4 pre=5 rc=6,
//           98 for a plain release and 99 for 'patch' (post-release)
//    18     number that follows the release stage ("beta 9"), else '0'
//    19     SvarDOS revision given after a '+' (1.0+5), else '0'
//
// returns false when the version string cannot be understood.
function vertoarr($verstr) {
  $subver = array(0,0,0,0);

  // switch string to lcase for easier processing and trim any leading or trailing white spaces
  $verstr = strtolower(trim($verstr));

  // an empty version cannot be parsed (and strrpos() below would throw a
  // ValueError on PHP 8 because its offset would lie outside the string)
  if ($verstr === '') return(false);

  // replace all '-' and '/' characters to '.' (uniformization of sub-version parts delimiters)
  $verstr = strtr($verstr, '-/', '..');

  // is there a subversion value? (for example "+4" in "1.05+4")
  // the search starts at offset 1 so a leading '+' is never taken as a separator
  $i = strrpos($verstr, '+', 1);
  if ($i !== false) {
    // validate the svar-version is a proper integer: the pattern must be
    // anchored, otherwise anything that merely contains a digit ("x5") passes
    $svarver = substr($verstr, $i + 1);
    if (! preg_match('/^[1-9][0-9]*$/', $svarver)) {
      return(false);
    }
    $subver[3] = intval($svarver); // set the +rev as a very minor item
    $verstr = substr($verstr, 0, $i);
  }

  // beta reordering: convert "beta 0.95" to "0.95 beta"
  if (preg_match('/^beta /', $verstr)) $verstr = substr($verstr, 5) . ' beta';

  // any occurrence of alpha,beta,gamma,delta etc preceded by a digit should have a space separator added
  // example: "2.6.0pre9" becomes "2.6.0 pre9"
  $verstr = preg_replace('/([0-9])(alpha|beta|gamma|delta|pre|rc|patch)/', '$1 $2', $verstr);

  // same as above, but this time adding a trailing space separator
  // example: "2.6.0 pre9" becomes "2.6.0 pre 9"
  $verstr = preg_replace('/(alpha|beta|gamma|delta|pre|rc|patch)([0-9])/', '$1 $2', $verstr);

  // is the version ending with ' alpha', 'beta', etc?
  if (preg_match('/ (alpha|beta|gamma|delta|pre|rc|patch)( [0-9]{1,4}){0,1}$/', $verstr)) {
    // if there is a trailing beta-number, process it first
    if (preg_match('/ [0-9]{1,4}$/', $verstr)) {
      $i = strrpos($verstr, ' ');
      $subver[2] = intval(substr($verstr, $i + 1));
      $verstr = trim(substr($verstr, 0, $i));
    }
    $i = strrpos($verstr, ' ');
    $greek = substr($verstr, $i + 1);
    $verstr = trim(substr($verstr, 0, $i));

    // rank of each release stage; 'patch' is a POST-release version, as
    // opposed to all the others that are PRE-release versions
    $greekrank = array('alpha' => 1, 'beta' => 2, 'gamma' => 3, 'delta' => 4, 'pre' => 5, 'rc' => 6, 'patch' => 99);
    if (!isset($greekrank[$greek])) {
      return(false);
    }
    $subver[1] = $greekrank[$greek];
  } else {
    $subver[1] = 98; // one less than the 'patch' level
  }

  // does the version string have a single-letter subversion? (1.0c)
  if (preg_match('/[a-z]$/', $verstr)) {
    $subver[0] = ord(substr($verstr, -1));
    $verstr = substr_replace($verstr, '', -1); // remove last character from string
  }

  // convert "30-jan-99", "1999-jan-30" and "30-jan-1999" versions to "30jan99" or "30jan1999"
  // note that dashes have already been replaced by dots
  if (preg_match('/^([0-9][0-9]){1,2}\.(jan|feb|mar|apr|may|jun|jul|aug|sep|oct|nov|dec)\.([0-9][0-9]){1,2}$/', $verstr)) {
    $verstr = str_replace('.', '', $verstr);
  }

  // convert "2009mar17" versions to "17mar2009"
  if (preg_match('/^[0-9]{4}(jan|feb|mar|apr|may|jun|jul|aug|sep|oct|nov|dec)[0-9]{2}$/', $verstr)) {
    $dy = substr($verstr, 7);
    $mo = substr($verstr, 4, 3);
    $ye = substr($verstr, 0, 4);
    $verstr = "{$dy}{$mo}{$ye}";
  }

  // convert "30jan99" versions to 99.1.30 and "30jan1999" to 1999.1.30
  if (preg_match('/^[0-3][0-9](jan|feb|mar|apr|may|jun|jul|aug|sep|oct|nov|dec)([0-9][0-9]){1,2}$/', $verstr)) {
    $months = array('jan' => 1, 'feb' => 2, 'mar' => 3, 'apr' => 4, 'may' => 5, 'jun' => 6, 'jul' => 7, 'aug' => 8, 'sep' => 9, 'oct' => 10, 'nov' => 11, 'dec' => 12);
    $dy = substr($verstr, 0, 2);
    $mo = $months[substr($verstr, 2, 3)];
    $ye = substr($verstr, 5);
    $verstr = "{$ye}.{$mo}.{$dy}";
  }

  // validate the format is supported, should be something no more complex than 1.05.3.33
  if (! preg_match('/^[0-9][0-9.]{0,20}$/', $verstr)) {
    return(false);
  }

  // NOTE: a zero right after a separator and trailed with a digit (as in 1.01)
  //       has a special meaning
  $exploded = explode('.', $verstr);
  if (count($exploded) > 16) {
    return(false);
  }
  $exploded[16] = $subver[0]; // a-z (1.0c)
  $exploded[17] = $subver[1]; // alpha/beta/gamma/delta/rc/pre
  $exploded[18] = $subver[2]; // alpha-beta-gamma subversion (eg. "beta 9")
  $exploded[19] = $subver[3]; // svar-ver (1.0+5)
  // pad every missing, empty or zero slot with '0' so all results have 20 items
  for ($i = 0; $i < 20; $i++) if (empty($exploded[$i])) $exploded[$i] = '0';

  // slots were filled out of order, put the keys back in ascending order
  ksort($exploded);

  return($exploded);
}
189
 
189
 
190
 
190
 
191
// compares two version strings using the rules implemented by vertoarr().
//
// returns 1 when $v1 is newer than $v2, -1 when it is older and 0 when both
// are equivalent, which makes it usable as a usort()/uksort() callback.
//
// A version that vertoarr() cannot parse is considered older than any
// parsable one; two unparsable versions are ordered by plain byte comparison
// so the result stays deterministic. Without this, count() would be called on
// false, which is a TypeError on PHP 8.
function dos_version_compare($v1, $v2) {
  $v1arr = vertoarr($v1);
  $v2arr = vertoarr($v2);

  if (($v1arr === false) || ($v2arr === false)) {
    if ($v1arr !== false) return(1);
    if ($v2arr !== false) return(-1);
    // array keys that look like integers reach this callback as int, hence the casts
    return(strcmp((string)$v1, (string)$v2) <=> 0);
  }

  // the first differing slot decides
  for ($i = 0; $i < count($v1arr); $i++) {
    if ($v1arr[$i] > $v2arr[$i]) return(1);
    if ($v1arr[$i] < $v2arr[$i]) return(-1);
  }
  return(0);
}
200
 
200
 
201
 
201
 
202
// reads the entry named $fil from the zip archive $z and returns its content.
//
// The entry name is matched case-insensitively and at most 8192 bytes of the
// entry are returned. Returns false when the archive cannot be opened (an
// error line is printed in that case) or when the entry cannot be read.
function read_file_from_zip($z, $fil) {
  $archive = new ZipArchive();

  $opened = $archive->open($z, ZipArchive::RDONLY);
  if ($opened !== true) {
    echo "ERROR: failed to open zip file '{$z}'\n";
    return(false);
  }

  // fetch the requested entry (callers use this for appinfo/pkgname.lsm)
  $content = $archive->getFromName($fil, 8192, ZipArchive::FL_NOCASE);
  $archive->close();

  return($content);
}
216
 
216
 
217
 
217
 
218
// returns the names of all entries stored in the zip archive $z, in archive
// order, or false when the archive cannot be opened (an error line is
// printed in that case).
function read_list_of_files_in_zip($z) {
  $archive = new ZipArchive();

  $opened = $archive->open($z, ZipArchive::RDONLY);
  if ($opened !== true) {
    echo "ERROR: failed to open zip file '{$z}'\n";
    return(false);
  }

  $names = array();
  $idx = 0;
  while ($idx < $archive->numFiles) {
    $names[] = $archive->getNameIndex($idx);
    $idx++;
  }

  $archive->close();
  return($names);
}
231
 
231
 
232
 
232
 
233
// parses the text of an LSM file and returns it as an associative array.
//
// Every line of the form "token: value" yields one entry: the token is
// trimmed and lower-cased, the value is trimmed. Only the first colon of a
// line separates token from value. Lines without a colon, or starting with
// one, are ignored. When a token appears more than once the last value wins.
function parse_lsm($s) {
  $fields = array();

  foreach (explode("\n", $s) as $line) {
    // the line is "token: value", let's find the colon
    $sep = strpos($line, ':');
    if ($sep === false) continue;
    if ($sep === 0) continue;

    $key = strtolower(trim(substr($line, 0, $sep)));
    $fields[$key] = trim(substr($line, $sep + 1));
  }

  return($fields);
}
246
 
246
 
247
 
247
 
248
// tells whether $haystack begins with $needle (true) or not (false).
// PHP 8+ offers str_starts_with() for this, but PHP 7 does not, hence this
// helper.
function str_head_is($haystack, $needle) {
  $pos = strpos($haystack, $needle);
  return ($pos === 0);
}
252
 
252
 
253
 
253
 
254
// returns the list of CORE package names, built from the *.svp files found
// in the "core" subdirectory of $repodir. The name of a package is whatever
// precedes the first dot of its file name.
function load_core_list($repodir) {
  $names = array();

  foreach (scandir($repodir . '/core/') as $entry) {
    if (preg_match('/\.svp$/', $entry)) {
      $parts = explode('.', $entry);
      $names[] = $parts[0];
    }
  }

  return($names);
}
264
 
264
 
265
 
265
 
266
// ***************** MAIN ROUTINE *********************************************
266
// ***************** MAIN ROUTINE *********************************************
267
 
267
 
268
//echo "SvarDOS repository index generator ver {$PVER}\n";
268
//echo "SvarDOS repository index generator ver {$PVER}\n";
269
 
269
 
270
// exactly one argument is expected: the repository directory. An empty
// argument or anything that looks like an option (leading '-') is rejected.
// The empty check comes first so that [0] is never read on an empty string.
if (($_SERVER['argc'] != 2) || ($_SERVER['argv'][1] === '') || ($_SERVER['argv'][1][0] == '-')) {
  echo "usage: php buildidx.php repodir\n";
  exit(1);
}

$repodir = $_SERVER['argv'][1];

// list of every entry of the repository directory; give up right away when
// the directory cannot be read instead of going on with a bogus (false) list
$pkgfiles = scandir($repodir);
if ($pkgfiles === false) {
  echo "ERROR: unable to read directory '{$repodir}'\n";
  exit(1);
}
$pkgcount = 0;


// load the list of CORE and MSDOS_COMPAT packages

$core_packages_list = load_core_list($repodir);
$msdos_compat_list = explode(' ', 'append assign attrib chkdsk choice command comp cpidos debug defrag deltree diskcomp diskcopy display edit edlin exe2bin fc fdapm fdisk find format help himemx kernel keyb label localcfg mem mirror mode more move nlsfunc print replace share shsucdx sort swsubst tree undelete unformat xcopy');

// do a list of all svp packages with their available versions and descriptions

$pkgdb = array();
289
// walk through every entry of the repository directory: source archives
// (*.zip) are sanity-checked, packages (*.svp) are validated and recorded in
// $pkgdb[package name][version], anything else is reported as a wild file.
foreach ($pkgfiles as $fname) {

  // zip files (ie. source archives)
  if (preg_match('/\.zip$/', $fname)) {
    // the zip archive should contain at least one file; an archive that
    // cannot be opened yields false, which must not be handed to count()
    $srcfiles = read_list_of_files_in_zip($repodir . '/' . $fname);
    if (($srcfiles === false) || (count($srcfiles) < 1)) echo "WARNING: source archive {$fname} contains no files (either empty or corrupted)\n";
    // check that the file relates to an existing svp package
    $svpfname = preg_replace('/zip$/', 'svp', $fname);
    if (!file_exists($repodir . '/' . $svpfname)) echo "ERROR: orphaned source archive '{$fname}' (no matching svp file, expecting a package named '{$svpfname}')\n";
    // that is for zip files
    continue;
  }

  // skip (and warn about) non-svp
  if (!preg_match('/\.svp$/', $fname)) {
    $okfiles = array('.', '..', '_cats.json', '_index.json', '_buildidx.log', 'core');
    if (array_search($fname, $okfiles) !== false) continue;
    echo "WARNING: wild file '{$fname} (this is either an useless file that should be removed, or a misnamed package or source archive)'\n";
    continue;
  }

  if (!preg_match('/^[a-zA-Z0-9+. _-]*\.svp$/', $fname)) {
    echo "ERROR: {$fname} has a very weird name\n";
    continue;
  }

  // the package name is the part of the file name that precedes the first dash
  $path_parts = pathinfo($fname);
  $pkgnam = explode('-', $path_parts['filename'])[0];
  $pkgfullpath = realpath($repodir . '/' . $fname);

  $lsm = read_file_from_zip($pkgfullpath, "appinfo/{$pkgnam}.lsm");
  if ($lsm == false) {
    echo "ERROR: {$fname} does not contain an LSM file at the expected location\n";
    continue;
  }
  $lsmarray = parse_lsm($lsm);
  if (empty($lsmarray['version'])) {
    echo "ERROR: lsm file in {$fname} does not contain a version\n";
    continue;
  }
  if (strlen($lsmarray['version']) > 16) {
    echo "ERROR: version string in lsm file of {$fname} is too long (16 chars max)\n";
    continue;
  }
  if (empty($lsmarray['description'])) {
    echo "ERROR: lsm file in {$fname} does not contain a description\n";
    continue;
  }

  // validate the files present in the archive
  $listoffiles = read_list_of_files_in_zip($pkgfullpath);
  if ($listoffiles === false) $listoffiles = array(); // failure already reported by read_list_of_files_in_zip()
  $pkgdir = $pkgnam;

  // special rule for "parent and children" packages
  if (str_head_is($pkgnam, 'djgpp_')) $pkgdir = 'djgpp'; // djgpp_* packages put their files in djgpp
  if ($pkgnam == 'fbc_help') $pkgdir = 'fbc'; // FreeBASIC help goes to the FreeBASIC dir
  if ($pkgnam == 'clamdb') $pkgdir = 'clamav'; // data patterns for clamav

  // array used to detect duplicated entries after lower-case conversion
  $duparr = array();

  // will hold the list of categories that this package belongs to
  $catlist = array();

  foreach ($listoffiles as $f) {
    $f = strtolower($f);
    $path_array = explode('/', $f);
    // emit a warning when non-8+3 filenames are spotted and find duplicates
    foreach ($path_array as $item) {
      if (empty($item)) continue; // skip empty items at end of paths (eg. appinfo/)
      // the pattern is anchored on both ends: unanchored, it would accept any
      // name that merely contains one valid character
      if (!preg_match("/^[a-z0-9!#$%&'()@^_`{}~-]{1,8}(\.[a-z0-9!#$%&'()@^_`{}~-]{1,3}){0,1}$/", $item)) {
        echo "WARNING: {$fname} contains a non-8+3 path (or weird char): {$item} (in $f)\n";
      }
    }
    // look for dups
    if (array_search($f, $duparr) !== false) {
      echo "WARNING: {$fname} contains a duplicated entry: '{$f}'\n";
    } else {
      $duparr[] = $f;
    }
    // LSM file is ok
    if ($f === "appinfo/{$pkgnam}.lsm") continue;
    if ($f === "appinfo/") continue;
    // CORE and MSDOS_COMPAT packages are premium citizens and can do a little more
    $core_or_msdoscompat = 0;
    if (array_search($pkgnam, $core_packages_list) !== false) {
      $catlist[] = 'core';
      $core_or_msdoscompat = 1;
    }
    if (array_search($pkgnam, $msdos_compat_list) !== false) {
      $catlist[] = 'msdos_compat';
      $core_or_msdoscompat = 1;
    }
    if ($core_or_msdoscompat == 1) {
      if (str_head_is($f, 'bin/')) continue;
      if (str_head_is($f, 'cpi/')) continue;
      if (str_head_is($f, "doc/{$pkgdir}/")) continue;
      if ($f === 'doc/') continue;
      if (str_head_is($f, "nls/{$pkgdir}.")) continue;
      if ($f === 'nls/') continue;
    }
    // the help package is allowed to put files in... help
    if (($pkgnam == 'help') && (str_head_is($f, 'help/'))) continue;
    // must be category-prefixed file, add it to the list of categories for this package
    $catlist[] = explode('/', $f)[0];
    // well-known "category" dirs are okay
    if (str_head_is($f, "progs/{$pkgdir}/")) continue;
    if ($f === 'progs/') continue;
    if (str_head_is($f, "devel/{$pkgdir}/")) continue;
    if ($f === 'devel/') continue;
    if (str_head_is($f, "games/{$pkgdir}/")) continue;
    if ($f === 'games/') continue;
    if (str_head_is($f, "drivers/{$pkgdir}/")) continue;
    if ($f === 'drivers/') continue;
    echo "WARNING: {$fname} contains a file in an illegal location: {$f}\n";
  }

  // do I understand the version string?
  if (vertoarr($lsmarray['version']) === false) echo "WARNING: {$fname} parsing of version string failed ('{$lsmarray['version']}')\n";

  $meta['fname'] = $fname;
  $meta['desc'] = $lsmarray['description'];
  $meta['cats'] = array_unique($catlist);

  $pkgdb[$pkgnam][$lsmarray['version']] = $meta;
}
415
 
415
 
416
 
416
 
417
$db = array();   // per-package index: description, categories and versions
$cats = array(); // every category used by at least one package

// ******** build, for each package, the list of its versions (newest *********
// ******** first) along with one description and one category list **********

foreach ($pkgdb as $pkg => $versions) {

  // order the versions from the highest to the lowest: ascending sort on the
  // version strings (array keys), then reversal with keys preserved
  uksort($versions, 'dos_version_compare');
  $versions = array_reverse($versions, true);

  foreach ($versions as $ver => $meta) {
    $fname = $meta['fname'];
    $desc = $meta['desc'];

    // checksum of the package file itself
    $bsum = file2bsum(realpath($repodir . '/' . $fname));

    // strval() because a purely numeric version may come back as an integer key
    $meta2['ver'] = strval($ver);
    $meta2['bsum'] = $bsum;

    // description and categories are taken from the first version (in
    // newest-first order) that provides a non-empty value
    if (empty($db[$pkg]['desc'])) {
      $db[$pkg]['desc'] = $desc;
    }
    if (empty($db[$pkg]['cats'])) {
      $db[$pkg]['cats'] = $meta['cats'];
      $cats = array_unique(array_merge($cats, $meta['cats']));
    }

    $db[$pkg]['versions'][$fname] = $meta2;
  }

  // one more package indexed
  $pkgcount++;

}
450
 
450
 
451
if ($pkgcount < 100) echo "WARNING: an unexpectedly low number of packages has been found in the repo ({$pkgcount})\n";
451
if ($pkgcount < 100) echo "WARNING: an unexpectedly low number of packages has been found in the repo ({$pkgcount})\n";
452
 
452
 
453
$json_blob = json_encode($db);
453
$json_blob = json_encode($db);
454
if ($json_blob === false) {
454
if ($json_blob === false) {
455
  echo "ERROR: JSON convertion failed! -> ";
455
  echo "ERROR: JSON convertion failed! -> ";
456
  switch (json_last_error()) {
456
  switch (json_last_error()) {
457
    case JSON_ERROR_DEPTH:
457
    case JSON_ERROR_DEPTH:
458
      echo 'maximum stack depth exceeded';
458
      echo 'maximum stack depth exceeded';
459
      break;
459
      break;
460
    case JSON_ERROR_STATE_MISMATCH:
460
    case JSON_ERROR_STATE_MISMATCH:
461
      echo 'underflow of the modes mismatch';
461
      echo 'underflow of the modes mismatch';
462
      break;
462
      break;
463
    case JSON_ERROR_CTRL_CHAR:
463
    case JSON_ERROR_CTRL_CHAR:
464
      echo 'unexpected control character found';
464
      echo 'unexpected control character found';
465
      break;
465
      break;
466
    case JSON_ERROR_UTF8:
466
    case JSON_ERROR_UTF8:
467
      echo 'malformed utf-8 characters';
467
      echo 'malformed utf-8 characters';
468
      break;
468
      break;
469
    default:
469
    default:
470
      echo "unknown error";
470
      echo "unknown error";
471
      break;
471
      break;
472
  }
472
  }
473
  echo "\n";
473
  echo "\n";
474
}
474
}
475
 
475
 
476
file_put_contents($repodir . '/_index.json', $json_blob);
476
file_put_contents($repodir . '/_index.json', $json_blob);
477
 
477
 
478
$cats_json = json_encode($cats);
478
$cats_json = json_encode($cats);
479
file_put_contents($repodir . '/_cats.json', $cats_json);
479
file_put_contents($repodir . '/_cats.json', $cats_json);
480
 
480
 
481
exit(0);
481
exit(0);
482
 
482
 
483
?>
483
?>
484
 
484