| 1 | /* |
| 2 | * Copyright (C) 2002 Cyrus Patel <cyp@fb14.uni-mainz.de> |
| 3 | * (C) 2007, 2013 Apple Inc. All rights reserved. |
| 4 | * |
| 5 | * This library is free software; you can redistribute it and/or |
| 6 | * modify it under the terms of the GNU Lesser General Public |
| 7 | * License 2.1 as published by the Free Software Foundation. |
| 8 | * |
| 9 | * This library is distributed in the hope that it will be useful, |
| 10 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 11 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| 12 | * Library General Public License for more details. |
| 13 | * |
| 14 | * You should have received a copy of the GNU Library General Public License |
| 15 | * along with this library; see the file COPYING.LIB. If not, write to |
| 16 | * the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, |
| 17 | * Boston, MA 02110-1301, USA. |
| 18 | */ |
| 19 | |
| 20 | // This was originally Mozilla code, titled ParseFTPList.cpp |
| 21 | // Original version of this file can currently be found at: http://mxr.mozilla.org/mozilla1.8/source/netwerk/streamconv/converters/ParseFTPList.cpp |
| 22 | |
| 23 | #include "config.h" |
| 24 | #if ENABLE(FTPDIR) |
| 25 | #include "FTPDirectoryParser.h" |
| 26 | |
| 27 | // On Windows, use the threadsafe *_r functions provided by pthread. |
| 28 | #if OS(WINDOWS) && (USE(PTHREADS) || HAVE(PTHREAD_H)) |
| 29 | #include <pthread.h> |
| 30 | #endif |
| 31 | |
| 32 | #include <wtf/ASCIICType.h> |
| 33 | #include <stdio.h> |
| 34 | |
| 35 | |
| 36 | namespace WebCore { |
| 37 | |
// Compatibility shim: on Windows, when no gmtime_r macro is already defined,
// provide one that forwards to gmtime_s. Note that the two arguments are
// swapped when forwarding: gmtime_r(x, y) expands to gmtime_s(y, x).
// NOTE(review): the macro only adapts the argument order, not the return
// value -- gmtime_s presumably does not return the same thing as gmtime_r,
// so callers should not rely on the result of the call; confirm against the
// CRT documentation before using the return value.
#if OS(WINDOWS) && !defined(gmtime_r)
#define gmtime_r(x, y) gmtime_s((y), (x))
#endif
| 41 | |
| 42 | static inline FTPEntryType ParsingFailed(ListState& state) |
| 43 | { |
| 44 | if (state.parsedOne || state.listStyle) /* junk if we fail to parse */ |
| 45 | return FTPJunkEntry; /* this time but had previously parsed sucessfully */ |
| 46 | return FTPMiscEntry; /* its part of a comment or error message */ |
| 47 | } |
| 48 | |
| 49 | FTPEntryType parseOneFTPLine(const char* line, ListState& state, ListResult& result) |
| 50 | { |
| 51 | result.clear(); |
| 52 | |
| 53 | if (!line) |
| 54 | return FTPJunkEntry; |
| 55 | |
| 56 | state.numLines++; |
| 57 | |
| 58 | /* carry buffer is only valid from one line to the next */ |
| 59 | unsigned int carry_buf_len = state.carryBufferLength; |
| 60 | state.carryBufferLength = 0; |
| 61 | |
| 62 | unsigned linelen = 0; |
| 63 | |
| 64 | /* strip leading whitespace */ |
| 65 | while (*line == ' ' || *line == '\t') |
| 66 | line++; |
| 67 | |
| 68 | /* line is terminated at first '\0' or '\n' */ |
| 69 | const char* p = line; |
| 70 | while (*p && *p != '\n') |
| 71 | p++; |
| 72 | linelen = p - line; |
| 73 | |
| 74 | if (linelen > 0 && *p == '\n' && *(p-1) == '\r') |
| 75 | linelen--; |
| 76 | |
| 77 | /* DON'T strip trailing whitespace. */ |
| 78 | |
| 79 | if (linelen > 0) |
| 80 | { |
| 81 | static const char *month_names = "JanFebMarAprMayJunJulAugSepOctNovDec" ; |
| 82 | const char *tokens[16]; /* 16 is more than enough */ |
| 83 | unsigned int toklen[WTF_ARRAY_LENGTH(tokens)]; |
| 84 | unsigned int linelen_sans_wsp; // line length sans whitespace |
| 85 | unsigned int numtoks = 0; |
| 86 | unsigned int tokmarker = 0; /* extra info for lstyle handler */ |
| 87 | unsigned int month_num = 0; |
| 88 | char tbuf[4]; |
| 89 | int lstyle = 0; |
| 90 | |
| 91 | if (carry_buf_len) /* VMS long filename carryover buffer */ |
| 92 | { |
| 93 | tokens[0] = state.carryBuffer; |
| 94 | toklen[0] = carry_buf_len; |
| 95 | numtoks++; |
| 96 | } |
| 97 | |
| 98 | unsigned int pos = 0; |
| 99 | while (pos < linelen && numtoks < WTF_ARRAY_LENGTH(tokens)) |
| 100 | { |
| 101 | while (pos < linelen && |
| 102 | (line[pos] == ' ' || line[pos] == '\t' || line[pos] == '\r')) |
| 103 | pos++; |
| 104 | if (pos < linelen) |
| 105 | { |
| 106 | tokens[numtoks] = &line[pos]; |
| 107 | while (pos < linelen && |
| 108 | (line[pos] != ' ' && line[pos] != '\t' && line[pos] != '\r')) |
| 109 | pos++; |
| 110 | if (tokens[numtoks] != &line[pos]) |
| 111 | { |
| 112 | toklen[numtoks] = (&line[pos] - tokens[numtoks]); |
| 113 | numtoks++; |
| 114 | } |
| 115 | } |
| 116 | } |
| 117 | |
| 118 | if (!numtoks) |
| 119 | return ParsingFailed(state); |
| 120 | |
| 121 | linelen_sans_wsp = &(tokens[numtoks-1][toklen[numtoks-1]]) - tokens[0]; |
| 122 | if (numtoks == WTF_ARRAY_LENGTH(tokens)) |
| 123 | { |
| 124 | pos = linelen; |
| 125 | while (pos > 0 && (line[pos-1] == ' ' || line[pos-1] == '\t')) |
| 126 | pos--; |
| 127 | linelen_sans_wsp = pos; |
| 128 | } |
| 129 | |
| 130 | /* +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ */ |
| 131 | #if defined(SUPPORT_EPLF) |
| 132 | /* EPLF handling must come somewhere before /bin/dls handling. */ |
| 133 | if (!lstyle && (!state.listStyle || state.listStyle == 'E')) |
| 134 | { |
| 135 | if (*line == '+' && linelen > 4 && numtoks >= 2) |
| 136 | { |
| 137 | pos = 1; |
| 138 | while (pos < (linelen-1)) |
| 139 | { |
| 140 | p = &line[pos++]; |
| 141 | if (*p == '/') |
| 142 | result.type = FTPDirectoryEntry; /* its a dir */ |
| 143 | else if (*p == 'r') |
| 144 | result.type = FTPFileEntry; /* its a file */ |
| 145 | else if (*p == 'm') |
| 146 | { |
| 147 | if (isASCIIDigit(line[pos])) |
| 148 | { |
| 149 | while (pos < linelen && isASCIIDigit(line[pos])) |
| 150 | pos++; |
| 151 | if (pos < linelen && line[pos] == ',') |
| 152 | { |
| 153 | unsigned long long seconds = 0; |
| 154 | sscanf(p + 1, "%llu" , &seconds); |
| 155 | time_t t = static_cast<time_t>(seconds); |
| 156 | |
| 157 | // FIXME: This code has the year 2038 bug |
| 158 | gmtime_r(&t, &result.modifiedTime); |
| 159 | result.modifiedTime.tm_year += 1900; |
| 160 | } |
| 161 | } |
| 162 | } |
| 163 | else if (*p == 's') |
| 164 | { |
| 165 | if (isASCIIDigit(line[pos])) |
| 166 | { |
| 167 | while (pos < linelen && isASCIIDigit(line[pos])) |
| 168 | pos++; |
| 169 | if (pos < linelen && line[pos] == ',') |
| 170 | result.fileSize = String(p + 1, &line[pos] - p + 1); |
| 171 | } |
| 172 | } |
| 173 | else if (isASCIIAlpha(*p)) /* 'i'/'up' or unknown "fact" (property) */ |
| 174 | { |
| 175 | while (pos < linelen && *++p != ',') |
| 176 | pos++; |
| 177 | } |
| 178 | else if (*p != '\t' || (p+1) != tokens[1]) |
| 179 | { |
| 180 | break; /* its not EPLF after all */ |
| 181 | } |
| 182 | else |
| 183 | { |
| 184 | state.parsedOne = true; |
| 185 | state.listStyle = lstyle = 'E'; |
| 186 | |
| 187 | p = &(line[linelen_sans_wsp]); |
| 188 | result.filename = tokens[1]; |
| 189 | result.filenameLength = p - tokens[1]; |
| 190 | |
| 191 | if (!result.type) /* access denied */ |
| 192 | { |
| 193 | result.type = FTPFileEntry; /* is assuming 'f'ile correct? */ |
| 194 | return FTPJunkEntry; /* NO! junk it. */ |
| 195 | } |
| 196 | return result.type; |
| 197 | } |
| 198 | if (pos >= (linelen-1) || line[pos] != ',') |
| 199 | break; |
| 200 | pos++; |
| 201 | } /* while (pos < linelen) */ |
| 202 | result.clear(); |
| 203 | } /* if (*line == '+' && linelen > 4 && numtoks >= 2) */ |
| 204 | } /* if (!lstyle && (!state.listStyle || state.listStyle == 'E')) */ |
| 205 | #endif /* SUPPORT_EPLF */ |
| 206 | |
| 207 | /* +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ */ |
| 208 | |
| 209 | #if defined(SUPPORT_VMS) |
| 210 | if (!lstyle && (!state.listStyle || state.listStyle == 'V')) |
| 211 | { /* try VMS Multinet/UCX/CMS server */ |
| 212 | /* |
| 213 | * Legal characters in a VMS file/dir spec are [A-Z0-9$.-_~]. |
| 214 | * '$' cannot begin a filename and `-' cannot be used as the first |
| 215 | * or last character. '.' is only valid as a directory separator |
| 216 | * and <file>.<type> separator. A canonical filename spec might look |
| 217 | * like this: DISK$VOL:[DIR1.DIR2.DIR3]FILE.TYPE;123 |
| 218 | * All VMS FTP servers LIST in uppercase. |
| 219 | * |
| 220 | * We need to be picky about this in order to support |
| 221 | * multi-line listings correctly. |
| 222 | */ |
| 223 | if (!state.parsedOne && |
| 224 | (numtoks == 1 || (numtoks == 2 && toklen[0] == 9 && |
| 225 | memcmp(tokens[0], "Directory" , 9)==0 ))) |
| 226 | { |
| 227 | /* If no dirstyle has been detected yet, and this line is a |
| 228 | * VMS list's dirname, then turn on VMS dirstyle. |
| 229 | * eg "ACA:[ANONYMOUS]", "DISK$FTP:[ANONYMOUS]", "SYS$ANONFTP:" |
| 230 | */ |
| 231 | p = tokens[0]; |
| 232 | pos = toklen[0]; |
| 233 | if (numtoks == 2) |
| 234 | { |
| 235 | p = tokens[1]; |
| 236 | pos = toklen[1]; |
| 237 | } |
| 238 | pos--; |
| 239 | if (pos >= 3) |
| 240 | { |
| 241 | while (pos > 0 && p[pos] != '[') |
| 242 | { |
| 243 | pos--; |
| 244 | if (p[pos] == '-' || p[pos] == '$') |
| 245 | { |
| 246 | if (pos == 0 || p[pos-1] == '[' || p[pos-1] == '.' || |
| 247 | (p[pos] == '-' && (p[pos+1] == ']' || p[pos+1] == '.'))) |
| 248 | break; |
| 249 | } |
| 250 | else if (p[pos] != '.' && p[pos] != '~' && |
| 251 | !isASCIIDigit(p[pos]) && !isASCIIAlpha(p[pos])) |
| 252 | break; |
| 253 | else if (isASCIIAlpha(p[pos]) && p[pos] != toASCIIUpper(p[pos])) |
| 254 | break; |
| 255 | } |
| 256 | if (pos > 0) |
| 257 | { |
| 258 | pos--; |
| 259 | if (p[pos] != ':' || p[pos+1] != '[') |
| 260 | pos = 0; |
| 261 | } |
| 262 | } |
| 263 | if (pos > 0 && p[pos] == ':') |
| 264 | { |
| 265 | while (pos > 0) |
| 266 | { |
| 267 | pos--; |
| 268 | if (p[pos] != '$' && p[pos] != '_' && p[pos] != '-' && |
| 269 | p[pos] != '~' && !isASCIIDigit(p[pos]) && !isASCIIAlpha(p[pos])) |
| 270 | break; |
| 271 | else if (isASCIIAlpha(p[pos]) && p[pos] != toASCIIUpper(p[pos])) |
| 272 | break; |
| 273 | } |
| 274 | if (pos == 0) |
| 275 | { |
| 276 | state.listStyle = 'V'; |
| 277 | return FTPJunkEntry; /* its junk */ |
| 278 | } |
| 279 | } |
| 280 | /* fallthrough */ |
| 281 | } |
| 282 | else if ((tokens[0][toklen[0]-1]) != ';') |
| 283 | { |
| 284 | if (numtoks == 1 && (state.listStyle == 'V' && !carry_buf_len)) |
| 285 | lstyle = 'V'; |
| 286 | else if (numtoks < 4) |
| 287 | ; |
| 288 | else if (toklen[1] >= 10 && memcmp(tokens[1], "%RMS-E-PRV" , 10) == 0) |
| 289 | lstyle = 'V'; |
| 290 | else if ((&line[linelen] - tokens[1]) >= 22 && |
| 291 | memcmp(tokens[1], "insufficient privilege" , 22) == 0) |
| 292 | lstyle = 'V'; |
| 293 | else if (numtoks != 4 && numtoks != 6) |
| 294 | ; |
| 295 | else if (numtoks == 6 && ( |
| 296 | toklen[5] < 4 || *tokens[5] != '(' || /* perms */ |
| 297 | (tokens[5][toklen[5]-1]) != ')' )) |
| 298 | ; |
| 299 | else if ( (toklen[2] == 10 || toklen[2] == 11) && |
| 300 | (tokens[2][toklen[2]-5]) == '-' && |
| 301 | (tokens[2][toklen[2]-9]) == '-' && |
| 302 | (((toklen[3]==4 || toklen[3]==5 || toklen[3]==7 || toklen[3]==8) && |
| 303 | (tokens[3][toklen[3]-3]) == ':' ) || |
| 304 | ((toklen[3]==10 || toklen[3]==11 ) && |
| 305 | (tokens[3][toklen[3]-3]) == '.' ) |
| 306 | ) && /* time in [H]H:MM[:SS[.CC]] format */ |
| 307 | isASCIIDigit(*tokens[1]) && /* size */ |
| 308 | isASCIIDigit(*tokens[2]) && /* date */ |
| 309 | isASCIIDigit(*tokens[3]) /* time */ |
| 310 | ) |
| 311 | { |
| 312 | lstyle = 'V'; |
| 313 | } |
| 314 | if (lstyle == 'V') |
| 315 | { |
| 316 | /* |
| 317 | * MultiNet FTP: |
| 318 | * LOGIN.COM;2 1 4-NOV-1994 04:09 [ANONYMOUS] (RWE,RWE,,) |
| 319 | * PUB.DIR;1 1 27-JAN-1994 14:46 [ANONYMOUS] (RWE,RWE,RE,RWE) |
| 320 | * README.FTP;1 %RMS-E-PRV, insufficient privilege or file protection violation |
| 321 | * ROUSSOS.DIR;1 1 27-JAN-1994 14:48 [CS,ROUSSOS] (RWE,RWE,RE,R) |
| 322 | * S67-50903.JPG;1 328 22-SEP-1998 16:19 [ANONYMOUS] (RWED,RWED,,) |
| 323 | * UCX FTP: |
| 324 | * CII-MANUAL.TEX;1 213/216 29-JAN-1996 03:33:12 [ANONYMOU,ANONYMOUS] (RWED,RWED,,) |
| 325 | * CMU/VMS-IP FTP |
| 326 | * [VMSSERV.FILES]ALARM.DIR;1 1/3 5-MAR-1993 18:09 |
| 327 | * TCPware FTP |
| 328 | * FOO.BAR;1 4 5-MAR-1993 18:09:01.12 |
| 329 | * Long filename example: |
| 330 | * THIS-IS-A-LONG-VMS-FILENAME.AND-THIS-IS-A-LONG-VMS-FILETYPE\r\n |
| 331 | * 213[/nnn] 29-JAN-1996 03:33[:nn] [ANONYMOU,ANONYMOUS] (RWED,RWED,,) |
| 332 | */ |
| 333 | tokmarker = 0; |
| 334 | p = tokens[0]; |
| 335 | pos = 0; |
| 336 | if (*p == '[' && toklen[0] >= 4) /* CMU style */ |
| 337 | { |
| 338 | if (p[1] != ']') |
| 339 | { |
| 340 | p++; |
| 341 | pos++; |
| 342 | } |
| 343 | while (lstyle && pos < toklen[0] && *p != ']') |
| 344 | { |
| 345 | if (*p != '$' && *p != '.' && *p != '_' && *p != '-' && |
| 346 | *p != '~' && !isASCIIDigit(*p) && !isASCIIAlpha(*p)) |
| 347 | lstyle = 0; |
| 348 | pos++; |
| 349 | p++; |
| 350 | } |
| 351 | if (lstyle && pos < (toklen[0]-1)) |
| 352 | { |
| 353 | /* ']' was found and there is at least one character after it */ |
| 354 | ASSERT(*p == ']'); |
| 355 | pos++; |
| 356 | p++; |
| 357 | tokmarker = pos; /* length of leading "[DIR1.DIR2.etc]" */ |
| 358 | } else { |
| 359 | /* not a CMU style listing */ |
| 360 | lstyle = 0; |
| 361 | } |
| 362 | } |
| 363 | while (lstyle && pos < toklen[0] && *p != ';') |
| 364 | { |
| 365 | if (*p != '$' && *p != '.' && *p != '_' && *p != '-' && |
| 366 | *p != '~' && !isASCIIDigit(*p) && !isASCIIAlpha(*p)) |
| 367 | lstyle = 0; |
| 368 | else if (isASCIIAlpha(*p) && *p != toASCIIUpper(*p)) |
| 369 | lstyle = 0; |
| 370 | p++; |
| 371 | pos++; |
| 372 | } |
| 373 | if (lstyle && *p == ';') |
| 374 | { |
| 375 | if (pos == 0 || pos == (toklen[0]-1)) |
| 376 | lstyle = 0; |
| 377 | for (pos++;lstyle && pos < toklen[0];pos++) |
| 378 | { |
| 379 | if (!isASCIIDigit(tokens[0][pos])) |
| 380 | lstyle = 0; |
| 381 | } |
| 382 | } |
| 383 | pos = (p - tokens[0]); /* => fnlength sans ";####" */ |
| 384 | pos -= tokmarker; /* => fnlength sans "[DIR1.DIR2.etc]" */ |
| 385 | p = &(tokens[0][tokmarker]); /* offset of basename */ |
| 386 | |
| 387 | if (!lstyle || pos == 0 || pos > 80) /* VMS filenames can't be longer than that */ |
| 388 | { |
| 389 | lstyle = 0; |
| 390 | } |
| 391 | else if (numtoks == 1) |
| 392 | { |
| 393 | /* if VMS has been detected and there is only one token and that |
| 394 | * token was a VMS filename then this is a multiline VMS LIST entry. |
| 395 | */ |
| 396 | if (pos >= (sizeof(state.carryBuffer)-1)) |
| 397 | pos = (sizeof(state.carryBuffer)-1); /* shouldn't happen */ |
| 398 | memcpy( state.carryBuffer, p, pos ); |
| 399 | state.carryBufferLength = pos; |
| 400 | return FTPJunkEntry; /* tell caller to treat as junk */ |
| 401 | } |
| 402 | else if (isASCIIDigit(*tokens[1])) /* not no-privs message */ |
| 403 | { |
| 404 | for (pos = 0; lstyle && pos < (toklen[1]); pos++) |
| 405 | { |
| 406 | if (!isASCIIDigit((tokens[1][pos])) && (tokens[1][pos]) != '/') |
| 407 | lstyle = 0; |
| 408 | } |
| 409 | if (lstyle && numtoks > 4) /* Multinet or UCX but not CMU */ |
| 410 | { |
| 411 | for (pos = 1; lstyle && pos < (toklen[5]-1); pos++) |
| 412 | { |
| 413 | p = &(tokens[5][pos]); |
| 414 | if (*p!='R' && *p!='W' && *p!='E' && *p!='D' && *p!=',') |
| 415 | lstyle = 0; |
| 416 | } |
| 417 | } |
| 418 | } |
| 419 | } /* passed initial tests */ |
| 420 | } /* else if ((tokens[0][toklen[0]-1]) != ';') */ |
| 421 | |
| 422 | if (lstyle == 'V') |
| 423 | { |
| 424 | state.parsedOne = true; |
| 425 | state.listStyle = lstyle; |
| 426 | |
| 427 | if (isASCIIDigit(*tokens[1])) /* not permission denied etc */ |
| 428 | { |
| 429 | /* strip leading directory name */ |
| 430 | if (*tokens[0] == '[') /* CMU server */ |
| 431 | { |
| 432 | pos = toklen[0]-1; |
| 433 | p = tokens[0]+1; |
| 434 | while (*p != ']') |
| 435 | { |
| 436 | p++; |
| 437 | pos--; |
| 438 | } |
| 439 | toklen[0] = --pos; |
| 440 | tokens[0] = ++p; |
| 441 | } |
| 442 | pos = 0; |
| 443 | while (pos < toklen[0] && (tokens[0][pos]) != ';') |
| 444 | pos++; |
| 445 | |
| 446 | result.caseSensitive = true; |
| 447 | result.type = FTPFileEntry; |
| 448 | result.filename = tokens[0]; |
| 449 | result.filenameLength = pos; |
| 450 | |
| 451 | if (pos > 4) |
| 452 | { |
| 453 | p = &(tokens[0][pos-4]); |
| 454 | if (p[0] == '.' && p[1] == 'D' && p[2] == 'I' && p[3] == 'R') |
| 455 | { |
| 456 | result.filenameLength -= 4; |
| 457 | result.type = FTPDirectoryEntry; |
| 458 | } |
| 459 | } |
| 460 | |
| 461 | if (result.type != FTPDirectoryEntry) |
| 462 | { |
| 463 | /* #### or used/allocated form. If used/allocated form, then |
| 464 | * 'used' is the size in bytes if and only if 'used'<=allocated. |
| 465 | * If 'used' is size in bytes then it can be > 2^32 |
| 466 | * If 'used' is not size in bytes then it is size in blocks. |
| 467 | */ |
| 468 | pos = 0; |
| 469 | while (pos < toklen[1] && (tokens[1][pos]) != '/') |
| 470 | pos++; |
| 471 | |
| 472 | /* |
| 473 | * I've never seen size come back in bytes, its always in blocks, and |
| 474 | * the following test fails. So, always perform the "size in blocks". |
| 475 | * I'm leaving the "size in bytes" code if'd out in case we ever need |
| 476 | * to re-instate it. |
| 477 | */ |
| 478 | #if 0 |
| 479 | if (pos < toklen[1] && ( (pos<<1) > (toklen[1]-1) || |
| 480 | (strtoul(tokens[1], (char **)0, 10) > |
| 481 | strtoul(tokens[1]+pos+1, (char **)0, 10)) )) |
| 482 | { /* size is in bytes */ |
| 483 | if (pos > (sizeof(result.fe_size)-1)) |
| 484 | pos = sizeof(result.fe_size)-1; |
| 485 | memcpy( result.fe_size, tokens[1], pos ); |
| 486 | result.fe_size[pos] = '\0'; |
| 487 | } |
| 488 | else /* size is in blocks */ |
| 489 | #endif |
| 490 | { |
| 491 | /* size requires multiplication by blocksize. |
| 492 | * |
| 493 | * We could assume blocksize is 512 (like Lynx does) and |
| 494 | * shift by 9, but that might not be right. Even if it |
| 495 | * were, doing that wouldn't reflect what the file's |
| 496 | * real size was. The sanest thing to do is not use the |
| 497 | * LISTing's filesize, so we won't (like ftpmirror). |
| 498 | * |
| 499 | * ulltoa(((unsigned long long)fsz)<<9, result.fe_size, 10); |
| 500 | * |
| 501 | * A block is always 512 bytes on OpenVMS, compute size. |
| 502 | * So its rounded up to the next block, so what, its better |
| 503 | * than not showing the size at all. |
| 504 | * A block is always 512 bytes on OpenVMS, compute size. |
| 505 | * So its rounded up to the next block, so what, its better |
| 506 | * than not showing the size at all. |
| 507 | */ |
| 508 | uint64_t size = strtoull(tokens[1], 0, 10) * 512; |
| 509 | result.fileSize = String::number(size); |
| 510 | } |
| 511 | |
| 512 | } /* if (result.type != FTPDirectoryEntry) */ |
| 513 | |
| 514 | p = tokens[2] + 2; |
| 515 | if (*p == '-') |
| 516 | p++; |
| 517 | tbuf[0] = p[0]; |
| 518 | tbuf[1] = toASCIILower(p[1]); |
| 519 | tbuf[2] = toASCIILower(p[2]); |
| 520 | month_num = 0; |
| 521 | for (pos = 0; pos < (12*3); pos+=3) |
| 522 | { |
| 523 | if (tbuf[0] == month_names[pos+0] && |
| 524 | tbuf[1] == month_names[pos+1] && |
| 525 | tbuf[2] == month_names[pos+2]) |
| 526 | break; |
| 527 | month_num++; |
| 528 | } |
| 529 | if (month_num >= 12) |
| 530 | month_num = 0; |
| 531 | result.modifiedTime.tm_mon = month_num; |
| 532 | result.modifiedTime.tm_mday = atoi(tokens[2]); |
| 533 | result.modifiedTime.tm_year = atoi(p+4); // NSPR wants year as XXXX |
| 534 | |
| 535 | p = tokens[3] + 2; |
| 536 | if (*p == ':') |
| 537 | p++; |
| 538 | if (p[2] == ':') |
| 539 | result.modifiedTime.tm_sec = atoi(p+3); |
| 540 | result.modifiedTime.tm_hour = atoi(tokens[3]); |
| 541 | result.modifiedTime.tm_min = atoi(p); |
| 542 | |
| 543 | return result.type; |
| 544 | |
| 545 | } /* if (isASCIIDigit(*tokens[1])) */ |
| 546 | |
| 547 | return FTPJunkEntry; /* junk */ |
| 548 | |
| 549 | } /* if (lstyle == 'V') */ |
| 550 | } /* if (!lstyle && (!state.listStyle || state.listStyle == 'V')) */ |
| 551 | #endif |
| 552 | |
| 553 | /* +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ */ |
| 554 | |
| 555 | #if defined(SUPPORT_CMS) |
| 556 | /* Virtual Machine/Conversational Monitor System (IBM Mainframe) */ |
| 557 | if (!lstyle && (!state.listStyle || state.listStyle == 'C')) /* VM/CMS */ |
| 558 | { |
| 559 | /* LISTing according to mirror.pl |
| 560 | * Filename FileType Fm Format Lrecl Records Blocks Date Time |
| 561 | * LASTING GLOBALV A1 V 41 21 1 9/16/91 15:10:32 |
| 562 | * J43401 NETLOG A0 V 77 1 1 9/12/91 12:36:04 |
| 563 | * PROFILE EXEC A1 V 17 3 1 9/12/91 12:39:07 |
| 564 | * DIRUNIX SCRIPT A1 V 77 1216 17 1/04/93 20:30:47 |
| 565 | * MAIL PROFILE A2 F 80 1 1 10/14/92 16:12:27 |
| 566 | * BADY2K TEXT A0 V 1 1 1 1/03/102 10:11:12 |
| 567 | * AUTHORS A1 DIR - - - 9/20/99 10:31:11 |
| 568 | * |
| 569 | * LISTing from vm.marist.edu and vm.sc.edu |
| 570 | * 220-FTPSERVE IBM VM Level 420 at VM.MARIST.EDU, 04:58:12 EDT WEDNESDAY 2002-07-10 |
| 571 | * AUTHORS DIR - - - 1999-09-20 10:31:11 - |
| 572 | * HARRINGTON DIR - - - 1997-02-12 15:33:28 - |
| 573 | * PICS DIR - - - 2000-10-12 15:43:23 - |
| 574 | * SYSFILE DIR - - - 2000-07-20 17:48:01 - |
| 575 | * WELCNVT EXEC V 72 9 1 1999-09-20 17:16:18 - |
| 576 | * WELCOME EREADME F 80 21 1 1999-12-27 16:19:00 - |
| 577 | * WELCOME README V 82 21 1 1999-12-27 16:19:04 - |
| 578 | * README ANONYMOU V 71 26 1 1997-04-02 12:33:20 TCP291 |
| 579 | * README ANONYOLD V 71 15 1 1995-08-25 16:04:27 TCP291 |
| 580 | */ |
| 581 | if (numtoks >= 7 && (toklen[0]+toklen[1]) <= 16) |
| 582 | { |
| 583 | for (pos = 1; !lstyle && (pos+5) < numtoks; pos++) |
| 584 | { |
| 585 | p = tokens[pos]; |
| 586 | if ((toklen[pos] == 1 && (*p == 'F' || *p == 'V')) || |
| 587 | (toklen[pos] == 3 && *p == 'D' && p[1] == 'I' && p[2] == 'R')) |
| 588 | { |
| 589 | if (toklen[pos+5] == 8 && (tokens[pos+5][2]) == ':' && |
| 590 | (tokens[pos+5][5]) == ':' ) |
| 591 | { |
| 592 | p = tokens[pos+4]; |
| 593 | if ((toklen[pos+4] == 10 && p[4] == '-' && p[7] == '-') || |
| 594 | (toklen[pos+4] >= 7 && toklen[pos+4] <= 9 && |
| 595 | p[((p[1]!='/')?(2):(1))] == '/' && |
| 596 | p[((p[1]!='/')?(5):(4))] == '/')) |
| 597 | /* Y2K bugs possible ("7/06/102" or "13/02/101") */ |
| 598 | { |
| 599 | if ( (*tokens[pos+1] == '-' && |
| 600 | *tokens[pos+2] == '-' && |
| 601 | *tokens[pos+3] == '-') || |
| 602 | (isASCIIDigit(*tokens[pos+1]) && |
| 603 | isASCIIDigit(*tokens[pos+2]) && |
| 604 | isASCIIDigit(*tokens[pos+3])) ) |
| 605 | { |
| 606 | lstyle = 'C'; |
| 607 | tokmarker = pos; |
| 608 | } |
| 609 | } |
| 610 | } |
| 611 | } |
| 612 | } /* for (pos = 1; !lstyle && (pos+5) < numtoks; pos++) */ |
| 613 | } /* if (numtoks >= 7) */ |
| 614 | |
| 615 | /* extra checking if first pass */ |
| 616 | if (lstyle && !state.listStyle) |
| 617 | { |
| 618 | for (pos = 0, p = tokens[0]; lstyle && pos < toklen[0]; pos++, p++) |
| 619 | { |
| 620 | if (isASCIIAlpha(*p) && toASCIIUpper(*p) != *p) |
| 621 | lstyle = 0; |
| 622 | } |
| 623 | for (pos = tokmarker+1; pos <= tokmarker+3; pos++) |
| 624 | { |
| 625 | if (!(toklen[pos] == 1 && *tokens[pos] == '-')) |
| 626 | { |
| 627 | for (p = tokens[pos]; lstyle && p<(tokens[pos]+toklen[pos]); p++) |
| 628 | { |
| 629 | if (!isASCIIDigit(*p)) |
| 630 | lstyle = 0; |
| 631 | } |
| 632 | } |
| 633 | } |
| 634 | for (pos = 0, p = tokens[tokmarker+4]; |
| 635 | lstyle && pos < toklen[tokmarker+4]; pos++, p++) |
| 636 | { |
| 637 | if (*p == '/') |
| 638 | { |
| 639 | /* There may be Y2K bugs in the date. Don't simplify to |
| 640 | * pos != (len-3) && pos != (len-6) like time is done. |
| 641 | */ |
| 642 | if ((tokens[tokmarker+4][1]) == '/') |
| 643 | { |
| 644 | if (pos != 1 && pos != 4) |
| 645 | lstyle = 0; |
| 646 | } |
| 647 | else if (pos != 2 && pos != 5) |
| 648 | lstyle = 0; |
| 649 | } |
| 650 | else if (*p != '-' && !isASCIIDigit(*p)) |
| 651 | lstyle = 0; |
| 652 | else if (*p == '-' && pos != 4 && pos != 7) |
| 653 | lstyle = 0; |
| 654 | } |
| 655 | for (pos = 0, p = tokens[tokmarker+5]; |
| 656 | lstyle && pos < toklen[tokmarker+5]; pos++, p++) |
| 657 | { |
| 658 | if (*p != ':' && !isASCIIDigit(*p)) |
| 659 | lstyle = 0; |
| 660 | else if (*p == ':' && pos != (toklen[tokmarker+5]-3) |
| 661 | && pos != (toklen[tokmarker+5]-6)) |
| 662 | lstyle = 0; |
| 663 | } |
| 664 | } /* initial if() */ |
| 665 | |
| 666 | if (lstyle == 'C') |
| 667 | { |
| 668 | state.parsedOne = true; |
| 669 | state.listStyle = lstyle; |
| 670 | |
| 671 | p = tokens[tokmarker+4]; |
| 672 | if (toklen[tokmarker+4] == 10) /* newstyle: YYYY-MM-DD format */ |
| 673 | { |
| 674 | result.modifiedTime.tm_year = atoi(p+0) - 1900; |
| 675 | result.modifiedTime.tm_mon = atoi(p+5) - 1; |
| 676 | result.modifiedTime.tm_mday = atoi(p+8); |
| 677 | } |
| 678 | else /* oldstyle: [M]M/DD/YY format */ |
| 679 | { |
| 680 | pos = toklen[tokmarker+4]; |
| 681 | result.modifiedTime.tm_mon = atoi(p) - 1; |
| 682 | result.modifiedTime.tm_mday = atoi((p+pos)-5); |
| 683 | result.modifiedTime.tm_year = atoi((p+pos)-2); |
| 684 | if (result.modifiedTime.tm_year < 70) |
| 685 | result.modifiedTime.tm_year += 100; |
| 686 | } |
| 687 | |
| 688 | p = tokens[tokmarker+5]; |
| 689 | pos = toklen[tokmarker+5]; |
| 690 | result.modifiedTime.tm_hour = atoi(p); |
| 691 | result.modifiedTime.tm_min = atoi((p+pos)-5); |
| 692 | result.modifiedTime.tm_sec = atoi((p+pos)-2); |
| 693 | |
| 694 | result.caseSensitive = true; |
| 695 | result.filename = tokens[0]; |
| 696 | result.filenameLength = toklen[0]; |
| 697 | result.type = FTPFileEntry; |
| 698 | |
| 699 | p = tokens[tokmarker]; |
| 700 | if (toklen[tokmarker] == 3 && *p=='D' && p[1]=='I' && p[2]=='R') |
| 701 | result.type = FTPDirectoryEntry; |
| 702 | |
| 703 | if ((/*newstyle*/ toklen[tokmarker+4] == 10 && tokmarker > 1) || |
| 704 | (/*oldstyle*/ toklen[tokmarker+4] != 10 && tokmarker > 2)) |
| 705 | { /* have a filetype column */ |
| 706 | char *dot; |
| 707 | p = &(tokens[0][toklen[0]]); |
| 708 | memcpy( &dot, &p, sizeof(dot) ); /* NASTY! */ |
| 709 | *dot++ = '.'; |
| 710 | p = tokens[1]; |
| 711 | for (pos = 0; pos < toklen[1]; pos++) |
| 712 | *dot++ = *p++; |
| 713 | result.filenameLength += 1 + toklen[1]; |
| 714 | } |
| 715 | |
| 716 | /* oldstyle LISTING: |
| 717 | * files/dirs not on the 'A' minidisk are not RETRievable/CHDIRable |
| 718 | if (toklen[tokmarker+4] != 10 && *tokens[tokmarker-1] != 'A') |
| 719 | return FTPJunkEntry; |
| 720 | */ |
| 721 | |
| 722 | /* VM/CMS LISTings have no usable filesize field. |
| 723 | * Have to use the 'SIZE' command for that. |
| 724 | */ |
| 725 | return result.type; |
| 726 | |
| 727 | } /* if (lstyle == 'C' && (!state.listStyle || state.listStyle == lstyle)) */ |
| 728 | } /* VM/CMS */ |
| 729 | #endif |
| 730 | |
| 731 | /* +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ */ |
| 732 | |
| 733 | #if defined(SUPPORT_DOS) /* WinNT DOS dirstyle */ |
| 734 | if (!lstyle && (!state.listStyle || state.listStyle == 'W')) |
| 735 | { |
| 736 | /* |
| 737 | * "10-23-00 01:27PM <DIR> veronist" |
| 738 | * "06-15-00 07:37AM <DIR> zoe" |
| 739 | * "07-14-00 01:35PM 2094926 canprankdesk.tif" |
| 740 | * "07-21-00 01:19PM 95077 Jon Kauffman Enjoys the Good Life.jpg" |
| 741 | * "07-21-00 01:19PM 52275 Name Plate.jpg" |
| 742 | * "07-14-00 01:38PM 2250540 Valentineoffprank-HiRes.jpg" |
| 743 | */ |
| 744 | if ((numtoks >= 4) && toklen[0] == 8 && toklen[1] == 7 && |
| 745 | (*tokens[2] == '<' || isASCIIDigit(*tokens[2])) ) |
| 746 | { |
| 747 | p = tokens[0]; |
| 748 | if ( isASCIIDigit(p[0]) && isASCIIDigit(p[1]) && p[2]=='-' && |
| 749 | isASCIIDigit(p[3]) && isASCIIDigit(p[4]) && p[5]=='-' && |
| 750 | isASCIIDigit(p[6]) && isASCIIDigit(p[7]) ) |
| 751 | { |
| 752 | p = tokens[1]; |
| 753 | if ( isASCIIDigit(p[0]) && isASCIIDigit(p[1]) && p[2]==':' && |
| 754 | isASCIIDigit(p[3]) && isASCIIDigit(p[4]) && |
| 755 | (p[5]=='A' || p[5]=='P') && p[6]=='M') |
| 756 | { |
| 757 | lstyle = 'W'; |
| 758 | if (!state.listStyle) |
| 759 | { |
| 760 | p = tokens[2]; |
| 761 | /* <DIR> or <JUNCTION> */ |
| 762 | if (*p != '<' || p[toklen[2]-1] != '>') |
| 763 | { |
| 764 | for (pos = 1; (lstyle && pos < toklen[2]); pos++) |
| 765 | { |
| 766 | if (!isASCIIDigit(*++p)) |
| 767 | lstyle = 0; |
| 768 | } |
| 769 | } |
| 770 | } |
| 771 | } |
| 772 | } |
| 773 | } |
| 774 | |
| 775 | if (lstyle == 'W') |
| 776 | { |
| 777 | state.parsedOne = true; |
| 778 | state.listStyle = lstyle; |
| 779 | |
| 780 | p = &(line[linelen]); /* line end */ |
| 781 | result.caseSensitive = true; |
| 782 | result.filename = tokens[3]; |
| 783 | result.filenameLength = p - tokens[3]; |
| 784 | result.type = FTPDirectoryEntry; |
| 785 | |
| 786 | if (*tokens[2] != '<') /* not <DIR> or <JUNCTION> */ |
| 787 | { |
| 788 | // try to handle correctly spaces at the beginning of the filename |
| 789 | // filesize (token[2]) must end at offset 38 |
| 790 | if (tokens[2] + toklen[2] - line == 38) { |
| 791 | result.filename = &(line[39]); |
| 792 | result.filenameLength = p - result.filename; |
| 793 | } |
| 794 | result.type = FTPFileEntry; |
| 795 | pos = toklen[2]; |
| 796 | result.fileSize = String(tokens[2], pos); |
| 797 | } |
| 798 | else { |
| 799 | // try to handle correctly spaces at the beginning of the filename |
| 800 | // token[2] must begin at offset 24, the length is 5 or 10 |
| 801 | // token[3] must begin at offset 39 or higher |
| 802 | if (tokens[2] - line == 24 && (toklen[2] == 5 || toklen[2] == 10) && |
| 803 | tokens[3] - line >= 39) { |
| 804 | result.filename = &(line[39]); |
| 805 | result.filenameLength = p - result.filename; |
| 806 | } |
| 807 | |
| 808 | if ((tokens[2][1]) != 'D') /* not <DIR> */ |
| 809 | { |
| 810 | result.type = FTPJunkEntry; /* unknown until junc for sure */ |
| 811 | if (result.filenameLength > 4) |
| 812 | { |
| 813 | p = result.filename; |
| 814 | for (pos = result.filenameLength - 4; pos > 0; pos--) |
| 815 | { |
| 816 | if (p[0] == ' ' && p[3] == ' ' && p[2] == '>' && |
| 817 | (p[1] == '=' || p[1] == '-')) |
| 818 | { |
| 819 | result.type = FTPLinkEntry; |
| 820 | result.filenameLength = p - result.filename; |
| 821 | result.linkname = p + 4; |
| 822 | result.linknameLength = &(line[linelen]) |
| 823 | - result.linkname; |
| 824 | break; |
| 825 | } |
| 826 | p++; |
| 827 | } |
| 828 | } |
| 829 | } |
| 830 | } |
| 831 | |
| 832 | result.modifiedTime.tm_mon = atoi(tokens[0]+0); |
| 833 | if (result.modifiedTime.tm_mon != 0) |
| 834 | { |
| 835 | result.modifiedTime.tm_mon--; |
| 836 | result.modifiedTime.tm_mday = atoi(tokens[0]+3); |
| 837 | result.modifiedTime.tm_year = atoi(tokens[0]+6); |
| 838 | /* if year has only two digits then assume that |
| 839 | 00-79 is 2000-2079 |
| 840 | 80-99 is 1980-1999 */ |
| 841 | if (result.modifiedTime.tm_year < 80) |
| 842 | result.modifiedTime.tm_year += 2000; |
| 843 | else if (result.modifiedTime.tm_year < 100) |
| 844 | result.modifiedTime.tm_year += 1900; |
| 845 | } |
| 846 | |
| 847 | result.modifiedTime.tm_hour = atoi(tokens[1]+0); |
| 848 | result.modifiedTime.tm_min = atoi(tokens[1]+3); |
| 849 | if ((tokens[1][5]) == 'P' && result.modifiedTime.tm_hour < 12) |
| 850 | result.modifiedTime.tm_hour += 12; |
| 851 | |
| 852 | /* the caller should do this (if dropping "." and ".." is desired) |
| 853 | if (result.type == FTPDirectoryEntry && result.filename[0] == '.' && |
| 854 | (result.filenameLength == 1 || (result.filenameLength == 2 && |
| 855 | result.filename[1] == '.'))) |
| 856 | return FTPJunkEntry; |
| 857 | */ |
| 858 | |
| 859 | return result.type; |
| 860 | } /* if (lstyle == 'W' && (!state.listStyle || state.listStyle == lstyle)) */ |
| 861 | } /* if (!lstyle && (!state.listStyle || state.listStyle == 'W')) */ |
| 862 | #endif |
| 863 | |
| 864 | /* +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ */ |
| 865 | |
| 866 | #if defined(SUPPORT_OS2) |
| 867 | if (!lstyle && (!state.listStyle || state.listStyle == 'O')) /* OS/2 test */ |
| 868 | { |
| 869 | /* 220 server IBM TCP/IP for OS/2 - FTP Server ver 23:04:36 on Jan 15 1997 ready. |
| 870 | * fixed position, space padded columns. I have only a vague idea |
| 871 | * of what the contents between col 18 and 34 might be: All I can infer |
| 872 | * is that there may be attribute flags in there and there may be |
| 873 | * a " DIR" in there. |
| 874 | * |
| 875 | * 1 2 3 4 5 6 |
| 876 | *0123456789012345678901234567890123456789012345678901234567890123456789 |
| 877 | *----- size -------|??????????????? MM-DD-YY| HH:MM| nnnnnnnnn.... |
| 878 | * 0 DIR 04-11-95 16:26 . |
| 879 | * 0 DIR 04-11-95 16:26 .. |
| 880 | * 0 DIR 04-11-95 16:26 ADDRESS |
| 881 | * 612 RHSA 07-28-95 16:45 air_tra1.bag |
| 882 | * 195 A 08-09-95 10:23 Alfa1.bag |
| 883 | * 0 RHS DIR 04-11-95 16:26 ATTACH |
| 884 | * 372 A 08-09-95 10:26 Aussie_1.bag |
| 885 | * 310992 06-28-94 09:56 INSTALL.EXE |
| 886 | * 1 2 3 4 |
| 887 | * 01234567890123456789012345678901234567890123456789 |
| 888 | * dirlist from the mirror.pl project, col positions from Mozilla. |
| 889 | */ |
| 890 | p = &(line[toklen[0]]); |
| 891 | /* \s(\d\d-\d\d-\d\d)\s+(\d\d:\d\d)\s */ |
| 892 | if (numtoks >= 4 && toklen[0] <= 18 && isASCIIDigit(*tokens[0]) && |
| 893 | (linelen - toklen[0]) >= (53-18) && |
| 894 | p[18-18] == ' ' && p[34-18] == ' ' && |
| 895 | p[37-18] == '-' && p[40-18] == '-' && p[43-18] == ' ' && |
| 896 | p[45-18] == ' ' && p[48-18] == ':' && p[51-18] == ' ' && |
| 897 | isASCIIDigit(p[35-18]) && isASCIIDigit(p[36-18]) && |
| 898 | isASCIIDigit(p[38-18]) && isASCIIDigit(p[39-18]) && |
| 899 | isASCIIDigit(p[41-18]) && isASCIIDigit(p[42-18]) && |
| 900 | isASCIIDigit(p[46-18]) && isASCIIDigit(p[47-18]) && |
| 901 | isASCIIDigit(p[49-18]) && isASCIIDigit(p[50-18]) |
| 902 | ) |
| 903 | { |
| 904 | lstyle = 'O'; /* OS/2 */ |
| 905 | if (!state.listStyle) |
| 906 | { |
| 907 | for (pos = 1; lstyle && pos < toklen[0]; pos++) |
| 908 | { |
| 909 | if (!isASCIIDigit(tokens[0][pos])) |
| 910 | lstyle = 0; |
| 911 | } |
| 912 | } |
| 913 | } |
| 914 | |
| 915 | if (lstyle == 'O') |
| 916 | { |
| 917 | state.parsedOne = true; |
| 918 | state.listStyle = lstyle; |
| 919 | |
| 920 | p = &(line[toklen[0]]); |
| 921 | |
| 922 | result.caseSensitive = true; |
| 923 | result.filename = &p[53-18]; |
| 924 | result.filenameLength = (&(line[linelen_sans_wsp])) |
| 925 | - (result.filename); |
| 926 | result.type = FTPFileEntry; |
| 927 | |
| 928 | /* I don't have a real listing to determine exact pos, so scan. */ |
| 929 | for (pos = (18-18); pos < ((35-18)-4); pos++) |
| 930 | { |
| 931 | if (p[pos+0] == ' ' && p[pos+1] == 'D' && |
| 932 | p[pos+2] == 'I' && p[pos+3] == 'R') |
| 933 | { |
| 934 | result.type = FTPDirectoryEntry; |
| 935 | break; |
| 936 | } |
| 937 | } |
| 938 | |
| 939 | if (result.type != FTPDirectoryEntry) |
| 940 | { |
| 941 | pos = toklen[0]; |
| 942 | result.fileSize = String(tokens[0], pos); |
| 943 | } |
| 944 | |
| 945 | result.modifiedTime.tm_mon = atoi(&p[35-18]) - 1; |
| 946 | result.modifiedTime.tm_mday = atoi(&p[38-18]); |
| 947 | result.modifiedTime.tm_year = atoi(&p[41-18]); |
| 948 | if (result.modifiedTime.tm_year < 80) |
| 949 | result.modifiedTime.tm_year += 100; |
| 950 | result.modifiedTime.tm_hour = atoi(&p[46-18]); |
| 951 | result.modifiedTime.tm_min = atoi(&p[49-18]); |
| 952 | |
| 953 | /* the caller should do this (if dropping "." and ".." is desired) |
| 954 | if (result.type == FTPDirectoryEntry && result.filename[0] == '.' && |
| 955 | (result.filenameLength == 1 || (result.filenameLength == 2 && |
| 956 | result.filename[1] == '.'))) |
| 957 | return FTPJunkEntry; |
| 958 | */ |
| 959 | |
| 960 | return result.type; |
| 961 | } /* if (lstyle == 'O') */ |
| 962 | |
| 963 | } /* if (!lstyle && (!state.listStyle || state.listStyle == 'O')) */ |
| 964 | #endif |
| 965 | |
| 966 | /* +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ */ |
| 967 | |
| 968 | #if defined(SUPPORT_LSL) |
| 969 | if (!lstyle && (!state.listStyle || state.listStyle == 'U')) /* /bin/ls & co. */ |
| 970 | { |
| 971 | /* UNIX-style listing, without inum and without blocks |
| 972 | * "-rw-r--r-- 1 root other 531 Jan 29 03:26 README" |
| 973 | * "dr-xr-xr-x 2 root other 512 Apr 8 1994 etc" |
| 974 | * "dr-xr-xr-x 2 root 512 Apr 8 1994 etc" |
| 975 | * "lrwxrwxrwx 1 root other 7 Jan 25 00:17 bin -> usr/bin" |
| 976 | * Also produced by Microsoft's FTP servers for Windows: |
| 977 | * "---------- 1 owner group 1803128 Jul 10 10:18 ls-lR.Z" |
| 978 | * "d--------- 1 owner group 0 May 9 19:45 Softlib" |
| 979 | * Also WFTPD for MSDOS: |
| 980 | * "-rwxrwxrwx 1 noone nogroup 322 Aug 19 1996 message.ftp" |
| 981 | * Hellsoft for NetWare: |
| 982 | * "d[RWCEMFA] supervisor 512 Jan 16 18:53 login" |
| 983 | * "-[RWCEMFA] rhesus 214059 Oct 20 15:27 cx.exe" |
| 984 | * Newer Hellsoft for NetWare: (netlab2.usu.edu) |
| 985 | * - [RWCEAFMS] NFAUUser 192 Apr 27 15:21 HEADER.html |
| 986 | * d [RWCEAFMS] jrd 512 Jul 11 03:01 allupdates |
| 987 | * Also NetPresenz for the Mac: |
| 988 | * "-------r-- 326 1391972 1392298 Nov 22 1995 MegaPhone.sit" |
| 989 | * "drwxrwxr-x folder 2 May 10 1996 network" |
| 990 | * Protected directory: |
| 991 | * "drwx-wx-wt 2 root wheel 512 Jul 1 02:15 incoming" |
| 992 | * uid/gid instead of username/groupname: |
| 993 | * "drwxr-xr-x 2 0 0 512 May 28 22:17 etc" |
| 994 | */ |
| 995 | |
| 996 | bool isOldHellsoft = false; |
| 997 | |
| 998 | if (numtoks >= 6) |
| 999 | { |
| 1000 | /* there are two perm formats (Hellsoft/NetWare and *IX strmode(3)). |
| 1001 | * Scan for size column only if the perm format is one or the other. |
| 1002 | */ |
| 1003 | if (toklen[0] == 1 || (tokens[0][1]) == '[') |
| 1004 | { |
| 1005 | if (*tokens[0] == 'd' || *tokens[0] == '-') |
| 1006 | { |
| 1007 | pos = toklen[0]-1; |
| 1008 | p = tokens[0] + 1; |
| 1009 | if (pos == 0) |
| 1010 | { |
| 1011 | p = tokens[1]; |
| 1012 | pos = toklen[1]; |
| 1013 | } |
| 1014 | if ((pos == 9 || pos == 10) && |
| 1015 | (*p == '[' && p[pos-1] == ']') && |
| 1016 | (p[1] == 'R' || p[1] == '-') && |
| 1017 | (p[2] == 'W' || p[2] == '-') && |
| 1018 | (p[3] == 'C' || p[3] == '-') && |
| 1019 | (p[4] == 'E' || p[4] == '-')) |
| 1020 | { |
| 1021 | /* rest is FMA[S] or AFM[S] */ |
| 1022 | lstyle = 'U'; /* very likely one of the NetWare servers */ |
| 1023 | if (toklen[0] == 10) |
| 1024 | isOldHellsoft = true; |
| 1025 | } |
| 1026 | } |
| 1027 | } |
| 1028 | else if ((toklen[0] == 10 || toklen[0] == 11) |
| 1029 | && strchr("-bcdlpsw?DFam" , *tokens[0])) |
| 1030 | { |
| 1031 | p = &(tokens[0][1]); |
| 1032 | if ((p[0] == 'r' || p[0] == '-') && |
| 1033 | (p[1] == 'w' || p[1] == '-') && |
| 1034 | (p[3] == 'r' || p[3] == '-') && |
| 1035 | (p[4] == 'w' || p[4] == '-') && |
| 1036 | (p[6] == 'r' || p[6] == '-') && |
| 1037 | (p[7] == 'w' || p[7] == '-')) |
| 1038 | /* 'x'/p[9] can be S|s|x|-|T|t or implementation specific */ |
| 1039 | { |
| 1040 | lstyle = 'U'; /* very likely /bin/ls */ |
| 1041 | } |
| 1042 | } |
| 1043 | } |
| 1044 | if (lstyle == 'U') /* first token checks out */ |
| 1045 | { |
| 1046 | lstyle = 0; |
| 1047 | for (pos = (numtoks-5); !lstyle && pos > 1; pos--) |
| 1048 | { |
| 1049 | /* scan for: (\d+)\s+([A-Z][a-z][a-z])\s+ |
| 1050 | * (\d\d\d\d|\d\:\d\d|\d\d\:\d\d|\d\:\d\d\:\d\d|\d\d\:\d\d\:\d\d) |
| 1051 | * \s+(.+)$ |
| 1052 | */ |
| 1053 | if (isASCIIDigit(*tokens[pos]) /* size */ |
| 1054 | /* (\w\w\w) */ |
| 1055 | && toklen[pos+1] == 3 && isASCIIAlpha(*tokens[pos+1]) && |
| 1056 | isASCIIAlpha(tokens[pos+1][1]) && isASCIIAlpha(tokens[pos+1][2]) |
| 1057 | /* (\d|\d\d) */ |
| 1058 | && isASCIIDigit(*tokens[pos+2]) && |
| 1059 | (toklen[pos+2] == 1 || |
| 1060 | (toklen[pos+2] == 2 && isASCIIDigit(tokens[pos+2][1]))) |
| 1061 | && toklen[pos+3] >= 4 && isASCIIDigit(*tokens[pos+3]) |
| 1062 | /* (\d\:\d\d\:\d\d|\d\d\:\d\d\:\d\d) */ |
| 1063 | && (toklen[pos+3] <= 5 || ( |
| 1064 | (toklen[pos+3] == 7 || toklen[pos+3] == 8) && |
| 1065 | (tokens[pos+3][toklen[pos+3]-3]) == ':')) |
| 1066 | && isASCIIDigit(tokens[pos+3][toklen[pos+3]-2]) |
| 1067 | && isASCIIDigit(tokens[pos+3][toklen[pos+3]-1]) |
| 1068 | && ( |
| 1069 | /* (\d\d\d\d) */ |
| 1070 | ((toklen[pos+3] == 4 || toklen[pos+3] == 5) && |
| 1071 | isASCIIDigit(tokens[pos+3][1]) && |
| 1072 | isASCIIDigit(tokens[pos+3][2]) ) |
| 1073 | /* (\d\:\d\d|\d\:\d\d\:\d\d) */ |
| 1074 | || ((toklen[pos+3] == 4 || toklen[pos+3] == 7) && |
| 1075 | (tokens[pos+3][1]) == ':' && |
| 1076 | isASCIIDigit(tokens[pos+3][2]) && isASCIIDigit(tokens[pos+3][3])) |
| 1077 | /* (\d\d\:\d\d|\d\d\:\d\d\:\d\d) */ |
| 1078 | || ((toklen[pos+3] == 5 || toklen[pos+3] == 8) && |
| 1079 | isASCIIDigit(tokens[pos+3][1]) && (tokens[pos+3][2]) == ':' && |
| 1080 | isASCIIDigit(tokens[pos+3][3]) && isASCIIDigit(tokens[pos+3][4])) |
| 1081 | ) |
| 1082 | ) |
| 1083 | { |
| 1084 | lstyle = 'U'; /* assume /bin/ls or variant format */ |
| 1085 | tokmarker = pos; |
| 1086 | |
| 1087 | /* check that size is numeric */ |
| 1088 | p = tokens[tokmarker]; |
| 1089 | for (unsigned int i = 0; lstyle && i < toklen[tokmarker]; ++i) |
| 1090 | { |
| 1091 | if (!isASCIIDigit(*p++)) |
| 1092 | lstyle = 0; |
| 1093 | } |
| 1094 | if (lstyle) |
| 1095 | { |
| 1096 | month_num = 0; |
| 1097 | p = tokens[tokmarker+1]; |
| 1098 | for (unsigned int i = 0; i < (12*3); i+=3) |
| 1099 | { |
| 1100 | if (p[0] == month_names[i+0] && |
| 1101 | p[1] == month_names[i+1] && |
| 1102 | p[2] == month_names[i+2]) |
| 1103 | break; |
| 1104 | month_num++; |
| 1105 | } |
| 1106 | if (month_num >= 12) |
| 1107 | lstyle = 0; |
| 1108 | } |
| 1109 | } /* relative position test */ |
| 1110 | } /* for (pos = (numtoks-5); !lstyle && pos > 1; pos--) */ |
| 1111 | } /* if (lstyle == 'U') */ |
| 1112 | |
| 1113 | if (lstyle == 'U') |
| 1114 | { |
| 1115 | state.parsedOne = true; |
| 1116 | state.listStyle = lstyle; |
| 1117 | |
| 1118 | result.caseSensitive = false; |
| 1119 | result.type = FTPJunkEntry; |
| 1120 | if (*tokens[0] == 'd' || *tokens[0] == 'D') |
| 1121 | result.type = FTPDirectoryEntry; |
| 1122 | else if (*tokens[0] == 'l') |
| 1123 | result.type = FTPLinkEntry; |
| 1124 | else if (*tokens[0] == '-' || *tokens[0] == 'F') |
| 1125 | result.type = FTPFileEntry; /* (hopefully a regular file) */ |
| 1126 | |
| 1127 | if (result.type != FTPDirectoryEntry) |
| 1128 | { |
| 1129 | pos = toklen[tokmarker]; |
| 1130 | result.fileSize = String(tokens[tokmarker], pos); |
| 1131 | } |
| 1132 | |
| 1133 | result.modifiedTime.tm_mon = month_num; |
| 1134 | result.modifiedTime.tm_mday = atoi(tokens[tokmarker+2]); |
| 1135 | if (result.modifiedTime.tm_mday == 0) |
| 1136 | result.modifiedTime.tm_mday++; |
| 1137 | |
| 1138 | p = tokens[tokmarker+3]; |
| 1139 | pos = (unsigned int)atoi(p); |
| 1140 | if (p[1] == ':') /* one digit hour */ |
| 1141 | p--; |
| 1142 | if (p[2] != ':') /* year */ |
| 1143 | { |
| 1144 | result.modifiedTime.tm_year = pos; |
| 1145 | } |
| 1146 | else |
| 1147 | { |
| 1148 | result.modifiedTime.tm_hour = pos; |
| 1149 | result.modifiedTime.tm_min = atoi(p+3); |
| 1150 | if (p[5] == ':') |
| 1151 | result.modifiedTime.tm_sec = atoi(p+6); |
| 1152 | |
| 1153 | if (!state.now) |
| 1154 | { |
| 1155 | time_t now = time(nullptr); |
| 1156 | state.now = now * 1000000.0; |
| 1157 | |
| 1158 | // FIXME: This code has the year 2038 bug |
| 1159 | gmtime_r(&now, &state.nowFTPTime); |
| 1160 | state.nowFTPTime.tm_year += 1900; |
| 1161 | } |
| 1162 | |
| 1163 | result.modifiedTime.tm_year = state.nowFTPTime.tm_year; |
| 1164 | if ( (( state.nowFTPTime.tm_mon << 5) + state.nowFTPTime.tm_mday) < |
| 1165 | ((result.modifiedTime.tm_mon << 5) + result.modifiedTime.tm_mday) ) |
| 1166 | result.modifiedTime.tm_year--; |
| 1167 | |
| 1168 | } /* time/year */ |
| 1169 | |
| 1170 | // there is exactly 1 space between filename and previous token in all |
| 1171 | // outputs except old Hellsoft |
| 1172 | if (!isOldHellsoft) |
| 1173 | result.filename = tokens[tokmarker+3] + toklen[tokmarker+3] + 1; |
| 1174 | else |
| 1175 | result.filename = tokens[tokmarker+4]; |
| 1176 | |
| 1177 | result.filenameLength = (&(line[linelen])) |
| 1178 | - (result.filename); |
| 1179 | |
| 1180 | if (result.type == FTPLinkEntry && result.filenameLength > 4) |
| 1181 | { |
| 1182 | /* First try to use result.fileSize to find the " -> " sequence. |
| 1183 | This can give the proper result for cases like "aaa -> bbb -> ccc". */ |
| 1184 | unsigned int fileSize = result.fileSize.toUInt(); |
| 1185 | |
| 1186 | if (result.filenameLength > (fileSize + 4) && |
| 1187 | strncmp(result.filename + result.filenameLength - fileSize - 4, " -> " , 4) == 0) |
| 1188 | { |
| 1189 | result.linkname = result.filename + (result.filenameLength - fileSize); |
| 1190 | result.linknameLength = (&(line[linelen])) - (result.linkname); |
| 1191 | result.filenameLength -= fileSize + 4; |
| 1192 | } |
| 1193 | else |
| 1194 | { |
| 1195 | /* Search for the sequence " -> " from the end, for the case where it |
| 1196 | occurs more than once. E.g. if ftpd returns "a -> b -> c", assume |
| 1197 | "a -> b" is the name. Power users can remove unnecessary parts |
| 1198 | manually, but there is no way to follow the link when some |
| 1199 | essential part is missing. */ |
| 1200 | p = result.filename + (result.filenameLength - 5); |
| 1201 | for (pos = (result.filenameLength - 5); pos > 0; pos--) |
| 1202 | { |
| 1203 | if (strncmp(p, " -> " , 4) == 0) |
| 1204 | { |
| 1205 | result.linkname = p + 4; |
| 1206 | result.linknameLength = (&(line[linelen])) |
| 1207 | - (result.linkname); |
| 1208 | result.filenameLength = pos; |
| 1209 | break; |
| 1210 | } |
| 1211 | p--; |
| 1212 | } |
| 1213 | } |
| 1214 | } |
| 1215 | |
| 1216 | #if defined(SUPPORT_LSLF) /* some (very rare) servers return ls -lF */ |
| 1217 | if (result.filenameLength > 1) |
| 1218 | { |
| 1219 | p = result.filename[result.filenameLength-1]; |
| 1220 | pos = result.type; |
| 1221 | if (pos == 'd') { |
| 1222 | if (*p == '/') result.filenameLength--; /* directory */ |
| 1223 | } else if (pos == 'l') { |
| 1224 | if (*p == '@') result.filenameLength--; /* symlink */ |
| 1225 | } else if (pos == 'f') { |
| 1226 | if (*p == '*') result.filenameLength--; /* executable */ |
| 1227 | } else if (*p == '=' || *p == '%' || *p == '|') { |
| 1228 | result.filenameLength--; /* socket, whiteout, fifo */ |
| 1229 | } |
| 1230 | } |
| 1231 | #endif |
| 1232 | |
| 1233 | /* the caller should do this (if dropping "." and ".." is desired) |
| 1234 | if (result.type == FTPDirectoryEntry && result.filename[0] == '.' && |
| 1235 | (result.filenameLength == 1 || (result.filenameLength == 2 && |
| 1236 | result.filename[1] == '.'))) |
| 1237 | return FTPJunkEntry; |
| 1238 | */ |
| 1239 | |
| 1240 | return result.type; |
| 1241 | |
| 1242 | } /* if (lstyle == 'U') */ |
| 1243 | |
| 1244 | } /* if (!lstyle && (!state.listStyle || state.listStyle == 'U')) */ |
| 1245 | #endif |
| 1246 | |
| 1247 | /* +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ */ |
| 1248 | |
| 1249 | #if defined(SUPPORT_W16) /* 16bit Windows */ |
| 1250 | if (!lstyle && (!state.listStyle || state.listStyle == 'w')) |
| 1251 | { /* old SuperTCP suite FTP server for Win3.1 */ |
| 1252 | /* old NetManage Chameleon TCP/IP suite FTP server for Win3.1 */ |
| 1253 | /* |
| 1254 | * SuperTCP dirlist from the mirror.pl project |
| 1255 | * mon/day/year separator may be '/' or '-'. |
| 1256 | * . <DIR> 11-16-94 17:16 |
| 1257 | * .. <DIR> 11-16-94 17:16 |
| 1258 | * INSTALL <DIR> 11-16-94 17:17 |
| 1259 | * CMT <DIR> 11-21-94 10:17 |
| 1260 | * DESIGN1.DOC 11264 05-11-95 14:20 |
| 1261 | * README.TXT 1045 05-10-95 11:01 |
| 1262 | * WPKIT1.EXE 960338 06-21-95 17:01 |
| 1263 | * CMT.CSV 0 07-06-95 14:56 |
| 1264 | * |
| 1265 | * Chameleon dirlist guessed from lynx |
| 1266 | * . <DIR> Nov 16 1994 17:16 |
| 1267 | * .. <DIR> Nov 16 1994 17:16 |
| 1268 | * INSTALL <DIR> Nov 16 1994 17:17 |
| 1269 | * CMT <DIR> Nov 21 1994 10:17 |
| 1270 | * DESIGN1.DOC 11264 May 11 1995 14:20 A |
| 1271 | * README.TXT 1045 May 10 1995 11:01 |
| 1272 | * WPKIT1.EXE 960338 Jun 21 1995 17:01 R |
| 1273 | * CMT.CSV 0 Jul 06 1995 14:56 RHA |
| 1274 | */ |
| 1275 | if (numtoks >= 4 && toklen[0] < 13 && |
| 1276 | ((toklen[1] == 5 && *tokens[1] == '<') || isASCIIDigit(*tokens[1])) ) |
| 1277 | { |
| 1278 | if (numtoks == 4 |
| 1279 | && (toklen[2] == 8 || toklen[2] == 9) |
| 1280 | && (((tokens[2][2]) == '/' && (tokens[2][5]) == '/') || |
| 1281 | ((tokens[2][2]) == '-' && (tokens[2][5]) == '-')) |
| 1282 | && (toklen[3] == 4 || toklen[3] == 5) |
| 1283 | && (tokens[3][toklen[3]-3]) == ':' |
| 1284 | && isASCIIDigit(tokens[2][0]) && isASCIIDigit(tokens[2][1]) |
| 1285 | && isASCIIDigit(tokens[2][3]) && isASCIIDigit(tokens[2][4]) |
| 1286 | && isASCIIDigit(tokens[2][6]) && isASCIIDigit(tokens[2][7]) |
| 1287 | && (toklen[2] < 9 || isASCIIDigit(tokens[2][8])) |
| 1288 | && isASCIIDigit(tokens[3][toklen[3]-1]) && isASCIIDigit(tokens[3][toklen[3]-2]) |
| 1289 | && isASCIIDigit(tokens[3][toklen[3]-4]) && isASCIIDigit(*tokens[3]) |
| 1290 | ) |
| 1291 | { |
| 1292 | lstyle = 'w'; |
| 1293 | } |
| 1294 | else if ((numtoks == 6 || numtoks == 7) |
| 1295 | && toklen[2] == 3 && toklen[3] == 2 |
| 1296 | && toklen[4] == 4 && toklen[5] == 5 |
| 1297 | && (tokens[5][2]) == ':' |
| 1298 | && isASCIIAlpha(tokens[2][0]) && isASCIIAlpha(tokens[2][1]) |
| 1299 | && isASCIIAlpha(tokens[2][2]) |
| 1300 | && isASCIIDigit(tokens[3][0]) && isASCIIDigit(tokens[3][1]) |
| 1301 | && isASCIIDigit(tokens[4][0]) && isASCIIDigit(tokens[4][1]) |
| 1302 | && isASCIIDigit(tokens[4][2]) && isASCIIDigit(tokens[4][3]) |
| 1303 | && isASCIIDigit(tokens[5][0]) && isASCIIDigit(tokens[5][1]) |
| 1304 | && isASCIIDigit(tokens[5][3]) && isASCIIDigit(tokens[5][4]) |
| 1305 | /* could also check that (&(tokens[5][5]) - tokens[2]) == 17 */ |
| 1306 | ) |
| 1307 | { |
| 1308 | lstyle = 'w'; |
| 1309 | } |
| 1310 | if (lstyle && state.listStyle != lstyle) /* first time */ |
| 1311 | { |
| 1312 | p = tokens[1]; |
| 1313 | if (toklen[1] != 5 || p[0] != '<' || p[1] != 'D' || |
| 1314 | p[2] != 'I' || p[3] != 'R' || p[4] != '>') |
| 1315 | { |
| 1316 | for (pos = 0; lstyle && pos < toklen[1]; pos++) |
| 1317 | { |
| 1318 | if (!isASCIIDigit(*p++)) |
| 1319 | lstyle = 0; |
| 1320 | } |
| 1321 | } /* not <DIR> */ |
| 1322 | } /* if (first time) */ |
| 1323 | } /* if (numtoks == ...) */ |
| 1324 | |
| 1325 | if (lstyle == 'w') |
| 1326 | { |
| 1327 | state.parsedOne = true; |
| 1328 | state.listStyle = lstyle; |
| 1329 | |
| 1330 | result.caseSensitive = true; |
| 1331 | result.filename = tokens[0]; |
| 1332 | result.filenameLength = toklen[0]; |
| 1333 | result.type = FTPDirectoryEntry; |
| 1334 | |
| 1335 | p = tokens[1]; |
| 1336 | if (isASCIIDigit(*p)) |
| 1337 | { |
| 1338 | result.type = FTPFileEntry; |
| 1339 | pos = toklen[1]; |
| 1340 | result.fileSize = String(p, pos); |
| 1341 | } |
| 1342 | |
| 1343 | p = tokens[2]; |
| 1344 | if (toklen[2] == 3) /* Chameleon */ |
| 1345 | { |
| 1346 | tbuf[0] = toASCIIUpper(p[0]); |
| 1347 | tbuf[1] = toASCIILower(p[1]); |
| 1348 | tbuf[2] = toASCIILower(p[2]); |
| 1349 | for (pos = 0; pos < (12*3); pos+=3) |
| 1350 | { |
| 1351 | if (tbuf[0] == month_names[pos+0] && |
| 1352 | tbuf[1] == month_names[pos+1] && |
| 1353 | tbuf[2] == month_names[pos+2]) |
| 1354 | { |
| 1355 | result.modifiedTime.tm_mon = pos/3; |
| 1356 | result.modifiedTime.tm_mday = atoi(tokens[3]); |
| 1357 | result.modifiedTime.tm_year = atoi(tokens[4]) - 1900; |
| 1358 | break; |
| 1359 | } |
| 1360 | } |
| 1361 | pos = 5; /* Chameleon toknum of date field */ |
| 1362 | } |
| 1363 | else |
| 1364 | { |
| 1365 | result.modifiedTime.tm_mon = atoi(p+0)-1; |
| 1366 | result.modifiedTime.tm_mday = atoi(p+3); |
| 1367 | result.modifiedTime.tm_year = atoi(p+6); |
| 1368 | if (result.modifiedTime.tm_year < 80) /* SuperTCP */ |
| 1369 | result.modifiedTime.tm_year += 100; |
| 1370 | |
| 1371 | pos = 3; /* SuperTCP toknum of date field */ |
| 1372 | } |
| 1373 | |
| 1374 | result.modifiedTime.tm_hour = atoi(tokens[pos]); |
| 1375 | result.modifiedTime.tm_min = atoi(&(tokens[pos][toklen[pos]-2])); |
| 1376 | |
| 1377 | /* the caller should do this (if dropping "." and ".." is desired) |
| 1378 | if (result.type == FTPDirectoryEntry && result.filename[0] == '.' && |
| 1379 | (result.filenameLength == 1 || (result.filenameLength == 2 && |
| 1380 | result.filename[1] == '.'))) |
| 1381 | return FTPJunkEntry; |
| 1382 | */ |
| 1383 | |
| 1384 | return result.type; |
| 1385 | } /* (lstyle == 'w') */ |
| 1386 | |
| 1387 | } /* if (!lstyle && (!state.listStyle || state.listStyle == 'w')) */ |
| 1388 | #endif |
| 1389 | |
| 1390 | /* +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ */ |
| 1391 | |
| 1392 | #if defined(SUPPORT_DLS) /* dls -dtR */ |
| 1393 | if (!lstyle && |
| 1394 | (state.listStyle == 'D' || (!state.listStyle && state.numLines == 1))) |
| 1395 | /* /bin/dls lines have to be immediately recognizable (first line) */ |
| 1396 | { |
| 1397 | /* I haven't seen an FTP server that delivers a /bin/dls listing, |
| 1398 | * but can infer the format from the lynx and mirror.pl projects. |
| 1399 | * Both formats are supported. |
| 1400 | * |
| 1401 | * Lynx says: |
| 1402 | * README 763 Information about this server\0 |
| 1403 | * bin/ - \0 |
| 1404 | * etc/ = \0 |
| 1405 | * ls-lR 0 \0 |
| 1406 | * ls-lR.Z 3 \0 |
| 1407 | * pub/ = Public area\0 |
| 1408 | * usr/ - \0 |
| 1409 | * morgan 14 -> ../real/morgan\0 |
| 1410 | * TIMIT.mostlikely.Z\0 |
| 1411 | * 79215 \0 |
| 1412 | * |
| 1413 | * mirror.pl says: |
| 1414 | * filename: ^(\S*)\s+ |
| 1415 | * size: (\-|\=|\d+)\s+ |
| 1416 | * month/day: ((\w\w\w\s+\d+|\d+\s+\w\w\w)\s+ |
| 1417 | * time/year: (\d+:\d+|\d\d\d\d))\s+ |
| 1418 | * rest: (.+) |
| 1419 | * |
| 1420 | * README 763 Jul 11 21:05 Information about this server |
| 1421 | * bin/ - Apr 28 1994 |
| 1422 | * etc/ = 11 Jul 21:04 |
| 1423 | * ls-lR 0 6 Aug 17:14 |
| 1424 | * ls-lR.Z 3 05 Sep 1994 |
| 1425 | * pub/ = Jul 11 21:04 Public area |
| 1426 | * usr/ - Sep 7 09:39 |
| 1427 | * morgan 14 Apr 18 09:39 -> ../real/morgan |
| 1428 | * TIMIT.mostlikely.Z |
| 1429 | * 79215 Jul 11 21:04 |
| 1430 | */ |
| 1431 | if (!state.listStyle && line[linelen-1] == ':' && |
| 1432 | linelen >= 2 && toklen[numtoks-1] != 1) |
| 1433 | { |
| 1434 | /* code in mirror.pl suggests that a listing may be preceded |
| 1435 | * by a PWD line in the form "/some/dir/names/here:" |
| 1436 | * but does not necessarily begin with '/'. *sigh* |
| 1437 | */ |
| 1438 | pos = 0; |
| 1439 | p = line; |
| 1440 | while (pos < (linelen-1)) |
| 1441 | { |
| 1442 | /* illegal (or extremely unusual) chars in a dirspec */ |
| 1443 | if (*p == '<' || *p == '|' || *p == '>' || |
| 1444 | *p == '?' || *p == '*' || *p == '\\') |
| 1445 | break; |
| 1446 | if (*p == '/' && pos < (linelen-2) && p[1] == '/') |
| 1447 | break; |
| 1448 | pos++; |
| 1449 | p++; |
| 1450 | } |
| 1451 | if (pos == (linelen-1)) |
| 1452 | { |
| 1453 | state.listStyle = 'D'; |
| 1454 | return FTPJunkEntry; |
| 1455 | } |
| 1456 | } |
| 1457 | |
| 1458 | if (!lstyle && numtoks >= 2) |
| 1459 | { |
| 1460 | pos = 22; /* pos of (\d+|-|=) if this is not part of a multiline */ |
| 1461 | if (state.listStyle && carry_buf_len) /* first is from previous line */ |
| 1462 | pos = toklen[1]-1; /* and is 'as-is' (may contain whitespace) */ |
| 1463 | |
| 1464 | if (linelen > pos) |
| 1465 | { |
| 1466 | p = &line[pos]; |
| 1467 | if ((*p == '-' || *p == '=' || isASCIIDigit(*p)) && |
| 1468 | ((linelen == (pos+1)) || |
| 1469 | (linelen >= (pos+3) && p[1] == ' ' && p[2] == ' ')) ) |
| 1470 | { |
| 1471 | tokmarker = 1; |
| 1472 | if (!carry_buf_len) |
| 1473 | { |
| 1474 | pos = 1; |
| 1475 | while (pos < numtoks && (tokens[pos]+toklen[pos]) < (&line[23])) |
| 1476 | pos++; |
| 1477 | tokmarker = 0; |
| 1478 | if ((tokens[pos]+toklen[pos]) == (&line[23])) |
| 1479 | tokmarker = pos; |
| 1480 | } |
| 1481 | if (tokmarker) |
| 1482 | { |
| 1483 | lstyle = 'D'; |
| 1484 | if (*tokens[tokmarker] == '-' || *tokens[tokmarker] == '=') |
| 1485 | { |
| 1486 | if (toklen[tokmarker] != 1 || |
| 1487 | (tokens[tokmarker-1][toklen[tokmarker-1]-1]) != '/') |
| 1488 | lstyle = 0; |
| 1489 | } |
| 1490 | else |
| 1491 | { |
| 1492 | for (pos = 0; lstyle && pos < toklen[tokmarker]; pos++) |
| 1493 | { |
| 1494 | if (!isASCIIDigit(tokens[tokmarker][pos])) |
| 1495 | lstyle = 0; |
| 1496 | } |
| 1497 | } |
| 1498 | if (lstyle && !state.listStyle) /* first time */ |
| 1499 | { |
| 1500 | /* scan for illegal (or incredibly unusual) chars in fname */ |
| 1501 | for (p = tokens[0]; lstyle && |
| 1502 | p < &(tokens[tokmarker-1][toklen[tokmarker-1]]); p++) |
| 1503 | { |
| 1504 | if (*p == '<' || *p == '|' || *p == '>' || |
| 1505 | *p == '?' || *p == '*' || *p == '/' || *p == '\\') |
| 1506 | lstyle = 0; |
| 1507 | } |
| 1508 | } |
| 1509 | |
| 1510 | } /* size token found */ |
| 1511 | } /* expected chars behind expected size token */ |
| 1512 | } /* if (linelen > pos) */ |
| 1513 | } /* if (!lstyle && numtoks >= 2) */ |
| 1514 | |
| 1515 | if (!lstyle && state.listStyle == 'D' && !carry_buf_len) |
| 1516 | { |
| 1517 | /* the filename of a multi-line entry can be identified |
| 1518 | * correctly only if dls format had been previously established. |
| 1519 | * This should always be true because there should be entries |
| 1520 | * for '.' and/or '..' and/or CWD that precede the rest of the |
| 1521 | * listing. |
| 1522 | */ |
| 1523 | pos = linelen; |
| 1524 | if (pos > (sizeof(state.carryBuffer)-1)) |
| 1525 | pos = sizeof(state.carryBuffer)-1; |
| 1526 | memcpy( state.carryBuffer, line, pos ); |
| 1527 | state.carryBufferLength = pos; |
| 1528 | return FTPJunkEntry; |
| 1529 | } |
| 1530 | |
| 1531 | if (lstyle == 'D') |
| 1532 | { |
| 1533 | state.parsedOne = true; |
| 1534 | state.listStyle = lstyle; |
| 1535 | |
| 1536 | p = &(tokens[tokmarker-1][toklen[tokmarker-1]]); |
| 1537 | result.filename = tokens[0]; |
| 1538 | result.filenameLength = p - tokens[0]; |
| 1539 | result.type = FTPFileEntry; |
| 1540 | |
| 1541 | if (result.filename[result.filenameLength-1] == '/') |
| 1542 | { |
| 1543 | if (result.linknameLength == 1) |
| 1544 | result.type = FTPJunkEntry; |
| 1545 | else |
| 1546 | { |
| 1547 | result.filenameLength--; |
| 1548 | result.type = FTPDirectoryEntry; |
| 1549 | } |
| 1550 | } |
| 1551 | else if (isASCIIDigit(*tokens[tokmarker])) |
| 1552 | { |
| 1553 | pos = toklen[tokmarker]; |
| 1554 | result.fileSize = String(tokens[tokmarker], pos); |
| 1555 | } |
| 1556 | |
| 1557 | if ((tokmarker+3) < numtoks && |
| 1558 | (&(tokens[numtoks-1][toklen[numtoks-1]]) - |
| 1559 | tokens[tokmarker+1]) >= (1+1+3+1+4) ) |
| 1560 | { |
| 1561 | pos = (tokmarker+3); |
| 1562 | p = tokens[pos]; |
| 1563 | pos = toklen[pos]; |
| 1564 | |
| 1565 | if ((pos == 4 || pos == 5) |
| 1566 | && isASCIIDigit(*p) && isASCIIDigit(p[pos-1]) && isASCIIDigit(p[pos-2]) |
| 1567 | && ((pos == 5 && p[2] == ':') || |
| 1568 | (pos == 4 && (isASCIIDigit(p[1]) || p[1] == ':'))) |
| 1569 | ) |
| 1570 | { |
| 1571 | month_num = tokmarker+1; /* assumed position of month field */ |
| 1572 | pos = tokmarker+2; /* assumed position of mday field */ |
| 1573 | if (isASCIIDigit(*tokens[month_num])) /* positions are reversed */ |
| 1574 | { |
| 1575 | month_num++; |
| 1576 | pos--; |
| 1577 | } |
| 1578 | p = tokens[month_num]; |
| 1579 | if (isASCIIDigit(*tokens[pos]) |
| 1580 | && (toklen[pos] == 1 || |
| 1581 | (toklen[pos] == 2 && isASCIIDigit(tokens[pos][1]))) |
| 1582 | && toklen[month_num] == 3 |
| 1583 | && isASCIIAlpha(*p) && isASCIIAlpha(p[1]) && isASCIIAlpha(p[2]) ) |
| 1584 | { |
| 1585 | pos = atoi(tokens[pos]); |
| 1586 | if (pos > 0 && pos <= 31) |
| 1587 | { |
| 1588 | result.modifiedTime.tm_mday = pos; |
| 1589 | month_num = 1; |
| 1590 | for (pos = 0; pos < (12*3); pos+=3) |
| 1591 | { |
| 1592 | if (p[0] == month_names[pos+0] && |
| 1593 | p[1] == month_names[pos+1] && |
| 1594 | p[2] == month_names[pos+2]) |
| 1595 | break; |
| 1596 | month_num++; |
| 1597 | } |
| 1598 | if (month_num > 12) |
| 1599 | result.modifiedTime.tm_mday = 0; |
| 1600 | else |
| 1601 | result.modifiedTime.tm_mon = month_num - 1; |
| 1602 | } |
| 1603 | } |
| 1604 | if (result.modifiedTime.tm_mday) |
| 1605 | { |
| 1606 | tokmarker += 3; /* skip mday/mon/yrtime (to find " -> ") */ |
| 1607 | p = tokens[tokmarker]; |
| 1608 | |
| 1609 | pos = atoi(p); |
| 1610 | if (pos > 24) |
| 1611 | result.modifiedTime.tm_year = pos-1900; |
| 1612 | else |
| 1613 | { |
| 1614 | if (p[1] == ':') |
| 1615 | p--; |
| 1616 | result.modifiedTime.tm_hour = pos; |
| 1617 | result.modifiedTime.tm_min = atoi(p+3); |
| 1618 | if (!state.now) |
| 1619 | { |
| 1620 | time_t now = time(nullptr); |
| 1621 | state.now = now * 1000000.0; |
| 1622 | |
| 1623 | // FIXME: This code has the year 2038 bug |
| 1624 | gmtime_r(&now, &state.nowFTPTime); |
| 1625 | state.nowFTPTime.tm_year += 1900; |
| 1626 | } |
| 1627 | result.modifiedTime.tm_year = state.nowFTPTime.tm_year; |
| 1628 | if ( (( state.nowFTPTime.tm_mon << 4) + state.nowFTPTime.tm_mday) < |
| 1629 | ((result.modifiedTime.tm_mon << 4) + result.modifiedTime.tm_mday) ) |
| 1630 | result.modifiedTime.tm_year--; |
| 1631 | } /* got year or time */ |
| 1632 | } /* got month/mday */ |
| 1633 | } /* may have year or time */ |
| 1634 | } /* enough remaining to possibly have date/time */ |
| 1635 | |
| 1636 | if (numtoks > (tokmarker+2)) |
| 1637 | { |
| 1638 | pos = tokmarker+1; |
| 1639 | p = tokens[pos]; |
| 1640 | if (toklen[pos] == 2 && *p == '-' && p[1] == '>') |
| 1641 | { |
| 1642 | p = &(tokens[numtoks-1][toklen[numtoks-1]]); |
| 1643 | result.type = FTPLinkEntry; |
| 1644 | result.linkname = tokens[pos+1]; |
| 1645 | result.linknameLength = p - result.linkname; |
| 1646 | if (result.linknameLength > 1 && |
| 1647 | result.linkname[result.linknameLength-1] == '/') |
| 1648 | result.linknameLength--; |
| 1649 | } |
| 1650 | } /* if (numtoks > (tokmarker+2)) */ |
| 1651 | |
| 1652 | /* the caller should do this (if dropping "." and ".." is desired) |
| 1653 | if (result.type == FTPDirectoryEntry && result.filename[0] == '.' && |
| 1654 | (result.filenameLength == 1 || (result.filenameLength == 2 && |
| 1655 | result.filename[1] == '.'))) |
| 1656 | return FTPJunkEntry; |
| 1657 | */ |
| 1658 | |
| 1659 | return result.type; |
| 1660 | |
| 1661 | } /* if (lstyle == 'D') */ |
| 1662 | } /* if (!lstyle && (!state.listStyle || state.listStyle == 'D')) */ |
| 1663 | #endif |
| 1664 | |
| 1665 | /* +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ */ |
| 1666 | |
| 1667 | } /* if (linelen > 0) */ |
| 1668 | |
| 1669 | return ParsingFailed(state); |
| 1670 | } |
| 1671 | |
| 1672 | } // namespace WebCore |
| 1673 | |
| 1674 | #endif // ENABLE(FTPDIR) |
| 1675 | |