123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885 |
- /*
- Routines for parsing output from the 'ls' command.
- Copyright (C) 1988-2025
- Free Software Foundation, Inc.
- Copyright (C) 1995, 1996 Miguel de Icaza
- Written by:
- Miguel de Icaza, 1995, 1996
- Slava Zanko <slavazanko@gmail.com>, 2011
- This file is part of the Midnight Commander.
- The Midnight Commander is free software: you can redistribute it
- and/or modify it under the terms of the GNU General Public License as
- published by the Free Software Foundation, either version 3 of the License,
- or (at your option) any later version.
- The Midnight Commander is distributed in the hope that it will be useful,
- but WITHOUT ANY WARRANTY; without even the implied warranty of
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- GNU General Public License for more details.
- You should have received a copy of the GNU General Public License
- along with this program. If not, see <http://www.gnu.org/licenses/>.
- */
- /**
- * \file
- * \brief Source: Utilities for VFS modules
- * \author Miguel de Icaza
- * \date 1995, 1996
- */
- #include <config.h>
- #include <ctype.h>
- #include <stdio.h>
- #include <stdlib.h>
- #include "lib/global.h"
- #include "lib/unixcompat.h" /* makedev */
- #include "lib/widget.h" /* message() */
- #include "utilvfs.h"
- /*** global variables ****************************************************************************/
- /*** file scope macro definitions ****************************************************************/
- /* Parsing code is used by ftpfs, shell and extfs */
- #define MAXCOLS 30
- /*** file scope type declarations ****************************************************************/
- /*** forward declarations (file scope functions) *************************************************/
- /*** file scope variables ************************************************************************/
- static char *columns[MAXCOLS]; /* Points to the string in column n */
- static int column_ptr[MAXCOLS]; /* Index from 0 to the starting positions of the columns */
- static size_t vfs_parse_ls_final_num_spaces = 0;
- /* --------------------------------------------------------------------------------------------- */
- /*** file scope functions ************************************************************************/
- /* --------------------------------------------------------------------------------------------- */
- static gboolean
- is_num (int idx)
- {
- char *column = columns[idx];
- return (column != NULL && isdigit (column[0]));
- }
- /* --------------------------------------------------------------------------------------------- */
- /* Return TRUE for MM-DD-YY and MM-DD-YYYY */
- static gboolean
- is_dos_date (const char *str)
- {
- size_t len;
- if (str == NULL)
- return FALSE;
- len = strlen (str);
- if (len != 8 && len != 10)
- return FALSE;
- if (str[2] != str[5])
- return FALSE;
- return (strchr ("\\-/", (int) str[2]) != NULL);
- }
- /* --------------------------------------------------------------------------------------------- */
- static gboolean
- is_week (const char *str, struct tm *tim)
- {
- static const char *week = "SunMonTueWedThuFriSat";
- const char *pos;
- if (str == NULL)
- return FALSE;
- pos = strstr (week, str);
- if (pos == NULL)
- return FALSE;
- if (tim != NULL)
- tim->tm_wday = (pos - week) / 3;
- return TRUE;
- }
- /* --------------------------------------------------------------------------------------------- */
- /**
- * Check for possible locale's abbreviated month name (Jan..Dec).
- * Any 3 bytes long string without digit, control and punctuation characters.
- * isalpha() is locale specific, so it cannot be used if current
- * locale is "C" and ftp server use Cyrillic.
- * NB: It is assumed there are no whitespaces in month.
- */
- static gboolean
- is_localized_month (const char *month)
- {
- int i;
- if (month == NULL)
- return FALSE;
- for (i = 0;
- i < 3 && *month != '\0' && !isdigit ((unsigned char) *month)
- && !iscntrl ((unsigned char) *month) && !ispunct ((unsigned char) *month); i++, month++)
- ;
- return (i == 3 && *month == '\0');
- }
- /* --------------------------------------------------------------------------------------------- */
- static gboolean
- is_time (const char *str, struct tm *tim)
- {
- const char *p, *p2;
- if (str == NULL)
- return FALSE;
- p = strchr (str, ':');
- if (p == NULL)
- return FALSE;
- p2 = strrchr (str, ':');
- if (p2 == NULL)
- return FALSE;
- if (p != p2)
- {
- if (sscanf (str, "%2d:%2d:%2d", &tim->tm_hour, &tim->tm_min, &tim->tm_sec) != 3)
- return FALSE;
- }
- else
- {
- if (sscanf (str, "%2d:%2d", &tim->tm_hour, &tim->tm_min) != 2)
- return FALSE;
- }
- return TRUE;
- }
- /* --------------------------------------------------------------------------------------------- */
- static gboolean
- is_year (char *str, struct tm *tim)
- {
- long year;
- if (str == NULL)
- return FALSE;
- if (strchr (str, ':') != NULL)
- return FALSE;
- if (strlen (str) != 4)
- return FALSE;
- /* cppcheck-suppress invalidscanf */
- if (sscanf (str, "%ld", &year) != 1)
- return FALSE;
- if (year < 1900 || year > 3000)
- return FALSE;
- tim->tm_year = (int) (year - 1900);
- return TRUE;
- }
- /* --------------------------------------------------------------------------------------------- */
- /*** public functions ****************************************************************************/
- /* --------------------------------------------------------------------------------------------- */
- gboolean
- vfs_parse_filetype (const char *s, size_t *ret_skipped, mode_t *ret_type)
- {
- mode_t type;
- switch (*s)
- {
- case 'd':
- type = S_IFDIR;
- break;
- case 'b':
- type = S_IFBLK;
- break;
- case 'c':
- type = S_IFCHR;
- break;
- case 'l':
- type = S_IFLNK;
- break;
- #ifdef S_IFSOCK
- case 's':
- type = S_IFSOCK;
- break;
- #else
- case 's':
- type = S_IFIFO;
- break;
- #endif
- #ifdef S_IFDOOR /* Solaris door */
- case 'D':
- type = S_IFDOOR;
- break;
- #else
- case 'D':
- type = S_IFIFO;
- break;
- #endif
- case 'p':
- type = S_IFIFO;
- break;
- #ifdef S_IFNAM /* Special named files */
- case 'n':
- type = S_IFNAM;
- break;
- #else
- case 'n':
- type = S_IFREG;
- break;
- #endif
- case 'm': /* Don't know what these are :-) */
- case '-':
- case '?':
- type = S_IFREG;
- break;
- default:
- return FALSE;
- }
- *ret_type = type;
- if (ret_skipped != NULL)
- *ret_skipped = 1;
- return TRUE;
- }
- /* --------------------------------------------------------------------------------------------- */
- gboolean
- vfs_parse_fileperms (const char *s, size_t *ret_skipped, mode_t *ret_perms)
- {
- const char *p = s;
- mode_t perms = 0;
- switch (*p++)
- {
- case '-':
- break;
- case 'r':
- perms |= S_IRUSR;
- break;
- default:
- return FALSE;
- }
- switch (*p++)
- {
- case '-':
- break;
- case 'w':
- perms |= S_IWUSR;
- break;
- default:
- return FALSE;
- }
- switch (*p++)
- {
- case '-':
- break;
- case 'S':
- perms |= S_ISUID;
- break;
- case 's':
- perms |= S_IXUSR | S_ISUID;
- break;
- case 'x':
- perms |= S_IXUSR;
- break;
- default:
- return FALSE;
- }
- switch (*p++)
- {
- case '-':
- break;
- case 'r':
- perms |= S_IRGRP;
- break;
- default:
- return FALSE;
- }
- switch (*p++)
- {
- case '-':
- break;
- case 'w':
- perms |= S_IWGRP;
- break;
- default:
- return FALSE;
- }
- switch (*p++)
- {
- case '-':
- break;
- case 'S':
- perms |= S_ISGID;
- break;
- case 'l':
- perms |= S_ISGID;
- break; /* found on Solaris */
- case 's':
- perms |= S_IXGRP | S_ISGID;
- break;
- case 'x':
- perms |= S_IXGRP;
- break;
- default:
- return FALSE;
- }
- switch (*p++)
- {
- case '-':
- break;
- case 'r':
- perms |= S_IROTH;
- break;
- default:
- return FALSE;
- }
- switch (*p++)
- {
- case '-':
- break;
- case 'w':
- perms |= S_IWOTH;
- break;
- default:
- return FALSE;
- }
- switch (*p++)
- {
- case '-':
- break;
- case 'T':
- perms |= S_ISVTX;
- break;
- case 't':
- perms |= S_IXOTH | S_ISVTX;
- break;
- case 'x':
- perms |= S_IXOTH;
- break;
- default:
- return FALSE;
- }
- if (*p == '+')
- /* ACLs on Solaris, HP-UX and others */
- p++;
- if (ret_skipped != NULL)
- *ret_skipped = p - s;
- *ret_perms = perms;
- return TRUE;
- }
- /* --------------------------------------------------------------------------------------------- */
- gboolean
- vfs_parse_filemode (const char *s, size_t *ret_skipped, mode_t *ret_mode)
- {
- const char *p = s;
- mode_t type, perms;
- size_t skipped;
- if (!vfs_parse_filetype (p, &skipped, &type))
- return FALSE;
- p += skipped;
- if (!vfs_parse_fileperms (p, &skipped, &perms))
- return FALSE;
- p += skipped;
- *ret_skipped = p - s;
- *ret_mode = type | perms;
- return TRUE;
- }
- /* --------------------------------------------------------------------------------------------- */
- gboolean
- vfs_parse_raw_filemode (const char *s, size_t *ret_skipped, mode_t *ret_mode)
- {
- const char *p = s;
- mode_t remote_type = 0, local_type, perms = 0;
- /* isoctal */
- for (; *p >= '0' && *p <= '7'; p++)
- {
- perms *= 010;
- perms += (*p - '0');
- }
- if (*p++ != ' ')
- return FALSE;
- for (; *p >= '0' && *p <= '7'; p++)
- {
- remote_type *= 010;
- remote_type += (*p - '0');
- }
- if (*p++ != ' ')
- return FALSE;
- /* generated with:
- $ perl -e 'use Fcntl ":mode";
- my @modes = (S_IFDIR, S_IFBLK, S_IFCHR, S_IFLNK, S_IFREG);
- foreach $t (@modes) { printf ("%o\n", $t); };'
- TODO: S_IFDOOR, S_IFIFO, S_IFSOCK (if supported by os)
- (see vfs_parse_filetype)
- */
- switch (remote_type)
- {
- case 020000:
- local_type = S_IFCHR;
- break;
- case 040000:
- local_type = S_IFDIR;
- break;
- case 060000:
- local_type = S_IFBLK;
- break;
- case 0120000:
- local_type = S_IFLNK;
- break;
- case 0100000:
- default: /* don't know what is it */
- local_type = S_IFREG;
- break;
- }
- *ret_skipped = p - s;
- *ret_mode = local_type | perms;
- return TRUE;
- }
- /* --------------------------------------------------------------------------------------------- */
- gboolean
- vfs_parse_month (const char *str, struct tm *tim)
- {
- static const char *month = "JanFebMarAprMayJunJulAugSepOctNovDec";
- const char *pos;
- if (str == NULL)
- return FALSE;
- pos = strstr (month, str);
- if (pos == NULL)
- return FALSE;
- if (tim != NULL)
- tim->tm_mon = (pos - month) / 3;
- return TRUE;
- }
- /* --------------------------------------------------------------------------------------------- */
- /** This function parses from idx in the columns[] array */
- int
- vfs_parse_filedate (int idx, time_t *t)
- {
- char *p;
- struct tm tim;
- int d[3];
- gboolean got_year = FALSE;
- gboolean l10n = FALSE; /* Locale's abbreviated month name */
- time_t current_time;
- struct tm *local_time;
- /* Let's setup default time values */
- current_time = time (NULL);
- local_time = localtime (¤t_time);
- tim.tm_mday = local_time->tm_mday;
- tim.tm_mon = local_time->tm_mon;
- tim.tm_year = local_time->tm_year;
- tim.tm_hour = 0;
- tim.tm_min = 0;
- tim.tm_sec = 0;
- tim.tm_isdst = -1; /* Let mktime() try to guess correct dst offset */
- p = columns[idx++];
- /* We eat weekday name in case of extfs */
- if (is_week (p, &tim))
- p = columns[idx++];
- /*
- ALLOWED DATE FORMATS
- We expect 3 fields max or we'll see oddities with certain file names.
- Formats that contain either year or time (the default 'ls' formats):
- * Mon DD hh:mm[:ss]
- * Mon DD YYYY
- Formats that contain both year and time, to make it easier to write
- extfs scripts:
- * MM-DD-YYYY hh:mm[:ss]
- * MM-DD-YY hh:mm[:ss]
- ('/' and '\' can be used instead of '-'.)
- where Mon is Jan-Dec, DD, MM, YY two digit day, month, year,
- YYYY four digit year, hh, mm, ss two digit hour, minute or second.
- (As for the "3 fields max" restriction: this prevents, for example, a
- file name "13:48" from being considered part of a "Sep 19 2016" date
- string preceding it.)
- */
- /* Month name */
- if (vfs_parse_month (p, &tim))
- {
- /* And we expect, it followed by day number */
- if (!is_num (idx))
- return 0; /* No day */
- tim.tm_mday = (int) atol (columns[idx++]);
- }
- else if (is_dos_date (p))
- {
- /* Case with MM-DD-YY or MM-DD-YYYY */
- p[2] = p[5] = '-';
- /* cppcheck-suppress invalidscanf */
- if (sscanf (p, "%2d-%2d-%d", &d[0], &d[1], &d[2]) != 3)
- return 0; /* sscanf failed */
- /* Months are zero based */
- if (d[0] > 0)
- d[0]--;
- if (d[2] > 1900)
- d[2] -= 1900;
- else if (d[2] < 70)
- /* Y2K madness */
- d[2] += 100;
- tim.tm_mon = d[0];
- tim.tm_mday = d[1];
- tim.tm_year = d[2];
- got_year = TRUE;
- }
- else if (is_localized_month (p) && is_num (idx++))
- /* Locale's abbreviated month name followed by day number */
- l10n = TRUE;
- else
- return 0; /* unsupported format */
- /* Here we expect to find time or year */
- if (!is_num (idx)
- || !(is_time (columns[idx], &tim) || (got_year = is_year (columns[idx], &tim))))
- return 0; /* Neither time nor date */
- idx++;
- /*
- * If the date is less than 6 months in the past, it is shown without year
- * other dates in the past or future are shown with year but without time
- * This does not check for years before 1900 ... I don't know, how
- * to represent them at all
- */
- if (!got_year && local_time->tm_mon < 6 && local_time->tm_mon < tim.tm_mon
- && tim.tm_mon - local_time->tm_mon >= 6)
- tim.tm_year--;
- *t = mktime (&tim);
- if (l10n || (*t < 0))
- *t = 0;
- return idx;
- }
- /* --------------------------------------------------------------------------------------------- */
- int
- vfs_split_text (char *p)
- {
- char *original = p;
- int numcols;
- memset (columns, 0, sizeof (columns));
- for (numcols = 0; *p != '\0' && numcols < MAXCOLS; numcols++)
- {
- for (; *p == ' ' || *p == '\r' || *p == '\n'; p++)
- *p = '\0';
- columns[numcols] = p;
- column_ptr[numcols] = p - original;
- for (; *p != '\0' && *p != ' ' && *p != '\r' && *p != '\n'; p++)
- ;
- }
- return numcols;
- }
- /* --------------------------------------------------------------------------------------------- */
- void
- vfs_parse_ls_lga_init (void)
- {
- vfs_parse_ls_final_num_spaces = 1;
- }
- /* --------------------------------------------------------------------------------------------- */
- size_t
- vfs_parse_ls_lga_get_final_spaces (void)
- {
- return vfs_parse_ls_final_num_spaces;
- }
- /* --------------------------------------------------------------------------------------------- */
- gboolean
- vfs_parse_ls_lga (const char *p, struct stat *s, char **filename, char **linkname,
- size_t *num_spaces)
- {
- int idx, idx2, num_cols;
- int i;
- char *p_copy = NULL;
- char *t = NULL;
- const char *line = p;
- size_t skipped;
- if (strncmp (p, "total", 5) == 0)
- return FALSE;
- if (!vfs_parse_filetype (p, &skipped, &s->st_mode))
- goto error;
- p += skipped;
- if (*p == ' ') /* Notwell 4 */
- p++;
- if (*p == '[')
- {
- if (strlen (p) <= 8 || p[8] != ']')
- goto error;
- /* Should parse here the Novell permissions :) */
- if (S_ISDIR (s->st_mode))
- s->st_mode |= (S_IRUSR | S_IRGRP | S_IROTH | S_IWUSR | S_IXUSR | S_IXGRP | S_IXOTH);
- else
- s->st_mode |= (S_IRUSR | S_IRGRP | S_IROTH | S_IWUSR);
- p += 9;
- }
- else
- {
- size_t lc_skipped;
- mode_t perms;
- if (!vfs_parse_fileperms (p, &lc_skipped, &perms))
- goto error;
- p += lc_skipped;
- s->st_mode |= perms;
- }
- p_copy = g_strdup (p);
- num_cols = vfs_split_text (p_copy);
- s->st_nlink = atol (columns[0]);
- if (s->st_nlink <= 0)
- goto error;
- if (!is_num (1))
- s->st_uid = vfs_finduid (columns[1]);
- else
- s->st_uid = (uid_t) atol (columns[1]);
- /* Mhm, the ls -lg did not produce a group field */
- for (idx = 3; idx <= 5; idx++)
- if (vfs_parse_month (columns[idx], NULL) || is_week (columns[idx], NULL)
- || is_dos_date (columns[idx]) || is_localized_month (columns[idx]))
- break;
- if (idx == 6 || (idx == 5 && !S_ISCHR (s->st_mode) && !S_ISBLK (s->st_mode)))
- goto error;
- /* We don't have gid */
- if (idx == 3 || (idx == 4 && (S_ISCHR (s->st_mode) || S_ISBLK (s->st_mode))))
- idx2 = 2;
- else
- {
- /* We have gid field */
- if (is_num (2))
- s->st_gid = (gid_t) atol (columns[2]);
- else
- s->st_gid = vfs_findgid (columns[2]);
- idx2 = 3;
- }
- /* This is device */
- if (S_ISCHR (s->st_mode) || S_ISBLK (s->st_mode))
- {
- int maj, min;
- /* Corner case: there is no whitespace(s) between maj & min */
- if (!is_num (idx2) && idx2 == 2)
- {
- /* cppcheck-suppress invalidscanf */
- if (!is_num (++idx2) || sscanf (columns[idx2], " %d,%d", &maj, &min) != 2)
- goto error;
- }
- else
- {
- /* cppcheck-suppress invalidscanf */
- if (!is_num (idx2) || sscanf (columns[idx2], " %d,", &maj) != 1)
- goto error;
- /* cppcheck-suppress invalidscanf */
- if (!is_num (++idx2) || sscanf (columns[idx2], " %d", &min) != 1)
- goto error;
- }
- #ifdef HAVE_STRUCT_STAT_ST_RDEV
- s->st_rdev = makedev (maj, min);
- #endif
- s->st_size = 0;
- }
- else
- {
- /* Common file size */
- if (!is_num (idx2))
- goto error;
- s->st_size = (off_t) g_ascii_strtoll (columns[idx2], NULL, 10);
- #ifdef HAVE_STRUCT_STAT_ST_RDEV
- s->st_rdev = 0;
- #endif
- }
- vfs_zero_stat_times (s);
- idx = vfs_parse_filedate (idx, &s->st_mtime);
- if (idx == 0)
- goto error;
- /* Use resulting time value */
- s->st_atime = s->st_ctime = s->st_mtime;
- /* s->st_dev and s->st_ino must be initialized by vfs_s_new_inode () */
- #ifdef HAVE_STRUCT_STAT_ST_BLKSIZE
- s->st_blksize = 512;
- #endif
- vfs_adjust_stat (s);
- if (num_spaces != NULL)
- {
- *num_spaces = column_ptr[idx] - column_ptr[idx - 1] - strlen (columns[idx - 1]);
- if (DIR_IS_DOTDOT (columns[idx]))
- vfs_parse_ls_final_num_spaces = *num_spaces;
- }
- for (i = idx + 1, idx2 = 0; i < num_cols; i++)
- if (strcmp (columns[i], "->") == 0)
- {
- idx2 = i;
- break;
- }
- if (((S_ISLNK (s->st_mode) || (num_cols == idx + 3 && s->st_nlink > 1))) /* Maybe a hardlink? (in extfs) */
- && idx2 != 0)
- {
- if (filename != NULL)
- *filename = g_strndup (p + column_ptr[idx], column_ptr[idx2] - column_ptr[idx] - 1);
- if (linkname != NULL)
- {
- t = g_strdup (p + column_ptr[idx2 + 1]);
- *linkname = t;
- }
- }
- else
- {
- /* Extract the filename from the string copy, not from the columns
- * this way we have a chance of entering hidden directories like ". ."
- */
- if (filename != NULL)
- {
- /* filename = g_strdup (columns [idx++]); */
- t = g_strdup (p + column_ptr[idx]);
- *filename = t;
- }
- if (linkname != NULL)
- *linkname = NULL;
- }
- if (t != NULL)
- {
- size_t p2;
- p2 = strlen (t);
- if (--p2 > 0 && (t[p2] == '\r' || t[p2] == '\n'))
- t[p2] = '\0';
- if (--p2 > 0 && (t[p2] == '\r' || t[p2] == '\n'))
- t[p2] = '\0';
- }
- g_free (p_copy);
- return TRUE;
- error:
- {
- static int errorcount = 0;
- if (++errorcount < 5)
- message (D_ERROR, _("Cannot parse:"), "%s",
- (p_copy != NULL && *p_copy != '\0') ? p_copy : line);
- else if (errorcount == 5)
- message (D_ERROR, MSG_ERROR, _("More parsing errors will be ignored."));
- }
- g_free (p_copy);
- return FALSE;
- }
- /* --------------------------------------------------------------------------------------------- */
|