2016-12-31 17:32:31 +01:00
|
|
|
|
package ftp
|
|
|
|
|
|
|
|
|
|
import (
|
|
|
|
|
"errors"
|
2018-01-04 13:25:44 +01:00
|
|
|
|
"fmt"
|
2016-12-31 17:32:31 +01:00
|
|
|
|
"strconv"
|
|
|
|
|
"strings"
|
|
|
|
|
"time"
|
|
|
|
|
)
|
|
|
|
|
|
2019-01-22 14:50:39 +01:00
|
|
|
|
// Sentinel errors returned by the LIST line parsers.
var (
	// errUnsupportedListLine reports that a parser does not recognise the
	// layout of the line it was given.
	errUnsupportedListLine = errors.New("unsupported LIST line")

	// errUnsupportedListDate reports a date field in a form setTime does not
	// handle.
	errUnsupportedListDate = errors.New("unsupported LIST date")

	// errUnknownListEntryType reports an ls-style line whose type character
	// is not one of the handled ones.
	errUnknownListEntryType = errors.New("unknown entry type")
)
|
2016-12-31 17:32:31 +01:00
|
|
|
|
|
2018-03-20 06:07:44 +01:00
|
|
|
|
// parseFunc is the signature shared by every LIST line parser: it receives
// the raw line, the reference time and the location used to interpret
// timestamps, and returns the decoded entry or an error.
type parseFunc func(line string, now time.Time, loc *time.Location) (*Entry, error)
|
2018-01-04 13:03:09 +01:00
|
|
|
|
|
|
|
|
|
var listLineParsers = []parseFunc{
|
2016-12-31 17:32:31 +01:00
|
|
|
|
parseRFC3659ListLine,
|
|
|
|
|
parseLsListLine,
|
|
|
|
|
parseDirListLine,
|
2017-07-06 02:55:11 +02:00
|
|
|
|
parseHostedFTPLine,
|
2023-06-29 18:58:13 +02:00
|
|
|
|
parseVMSFTPLine,
|
2016-12-31 17:32:31 +01:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// dirTimeFormats holds the timestamp layouts that parseDirListLine tries, in
// order, against the start of a line.
var dirTimeFormats = []string{
	"01-02-06 03:04PM", // month-day-year with a 12-hour clock
	"2006-01-02 15:04", // year-month-day with a 24-hour clock
}
|
|
|
|
|
|
2023-06-29 18:58:13 +02:00
|
|
|
|
// previousString carries the file name of a VMS listing line whose remaining
// columns are expected on the following line. It is empty when no
// continuation is pending.
var previousString string
|
|
|
|
|
|
|
|
|
|
func parseVMSFTPLine(s string, _ time.Time, location *time.Location) (*Entry, error) {
|
|
|
|
|
//If the string is empty, there are continuations on the next line(s)
|
|
|
|
|
if s == "" {
|
|
|
|
|
return nil, errUnsupportedListLine
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
scanner := newScanner(s)
|
|
|
|
|
filename := scanner.NextFields(1)[0]
|
|
|
|
|
|
|
|
|
|
// If the line does not contain a semicolon and there is nothing in previousString it is not a VMS FTP filename line
|
|
|
|
|
if !strings.Contains(filename, ";") && previousString == "" {
|
|
|
|
|
return nil, errUnsupportedListLine
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
remainingFields := scanner.NextFields(5)
|
|
|
|
|
|
|
|
|
|
// If there are no more fields then the current line has a continuation on the next line
|
|
|
|
|
if len(remainingFields) == 0 {
|
|
|
|
|
previousString = filename
|
|
|
|
|
return nil, errUnsupportedListLine
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// If there is a previousString, then the current line is a continuation of the previous line
|
|
|
|
|
// Insert the current filename in remainingFields and set filename to previousString
|
|
|
|
|
if previousString != "" {
|
|
|
|
|
remainingFields = append([]string{filename}, remainingFields...)
|
|
|
|
|
filename = previousString
|
|
|
|
|
// Reset previousString
|
|
|
|
|
previousString = ""
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if len(remainingFields) < 5 {
|
|
|
|
|
return nil, errUnsupportedListLine
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
entry := &Entry{}
|
|
|
|
|
// Files are formatted like this:
|
|
|
|
|
// FILENAME.EXT;1 123/125 12-DEC-2017 14:10:37 [GROUP,OWNER] (RWED,RWED,RE,)
|
|
|
|
|
// Directories are formatted like this:
|
|
|
|
|
// DIRECTORY.DIR;1 123/125 12-DEC-2017 14:10:37 [GROUP,OWNER] (RWED,RWED,RE,)
|
|
|
|
|
|
|
|
|
|
// Remove the version
|
|
|
|
|
parsedNameUnix := strings.Split(filename, ";")[0]
|
|
|
|
|
|
|
|
|
|
if strings.Contains(filename, ".DIR;") {
|
|
|
|
|
// Strip .DIR from parsedNameUnix
|
|
|
|
|
entry.Name = strings.Replace(parsedNameUnix, ".DIR", "", 1)
|
|
|
|
|
entry.Type = EntryTypeFolder
|
|
|
|
|
entry.Size = 0
|
|
|
|
|
} else {
|
|
|
|
|
entry.Name = parsedNameUnix
|
|
|
|
|
entry.Type = EntryTypeFile
|
|
|
|
|
// First number is the blocks used
|
|
|
|
|
parsedSize := strings.Split(remainingFields[0], "/")[0]
|
|
|
|
|
|
|
|
|
|
_ = entry.setSize(parsedSize)
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// Parse the date
|
|
|
|
|
entry.Time, _ = time.ParseInLocation("_2-Jan-2006 15:04:05", remainingFields[1]+" "+remainingFields[2], location)
|
|
|
|
|
|
|
|
|
|
return entry, nil
|
|
|
|
|
}
|
|
|
|
|
|
2016-12-31 17:32:31 +01:00
|
|
|
|
// parseRFC3659ListLine parses the style of directory line defined in RFC 3659.
|
2022-08-21 23:25:29 +02:00
|
|
|
|
func parseRFC3659ListLine(line string, _ time.Time, loc *time.Location) (*Entry, error) {
|
|
|
|
|
return parseNextRFC3659ListLine(line, loc, &Entry{})
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
func parseNextRFC3659ListLine(line string, loc *time.Location, e *Entry) (*Entry, error) {
|
2016-12-31 17:32:31 +01:00
|
|
|
|
iSemicolon := strings.Index(line, ";")
|
|
|
|
|
iWhitespace := strings.Index(line, " ")
|
|
|
|
|
|
|
|
|
|
if iSemicolon < 0 || iSemicolon > iWhitespace {
|
|
|
|
|
return nil, errUnsupportedListLine
|
|
|
|
|
}
|
|
|
|
|
|
2022-08-21 23:25:29 +02:00
|
|
|
|
name := line[iWhitespace+1:]
|
|
|
|
|
if e.Name == "" {
|
|
|
|
|
e.Name = name
|
|
|
|
|
} else if e.Name != name {
|
|
|
|
|
// All lines must have the same name
|
|
|
|
|
return nil, errUnsupportedListLine
|
2016-12-31 17:32:31 +01:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
for _, field := range strings.Split(line[:iWhitespace-1], ";") {
|
|
|
|
|
i := strings.Index(field, "=")
|
|
|
|
|
if i < 1 {
|
|
|
|
|
return nil, errUnsupportedListLine
|
|
|
|
|
}
|
|
|
|
|
|
2017-09-27 01:33:03 +02:00
|
|
|
|
key := strings.ToLower(field[:i])
|
2016-12-31 17:32:31 +01:00
|
|
|
|
value := field[i+1:]
|
|
|
|
|
|
|
|
|
|
switch key {
|
|
|
|
|
case "modify":
|
|
|
|
|
var err error
|
2018-03-20 06:07:44 +01:00
|
|
|
|
e.Time, err = time.ParseInLocation("20060102150405", value, loc)
|
2016-12-31 17:32:31 +01:00
|
|
|
|
if err != nil {
|
|
|
|
|
return nil, err
|
|
|
|
|
}
|
|
|
|
|
case "type":
|
|
|
|
|
switch value {
|
|
|
|
|
case "dir", "cdir", "pdir":
|
|
|
|
|
e.Type = EntryTypeFolder
|
|
|
|
|
case "file":
|
|
|
|
|
e.Type = EntryTypeFile
|
|
|
|
|
}
|
|
|
|
|
case "size":
|
2021-03-07 01:36:26 +01:00
|
|
|
|
if err := e.setSize(value); err != nil {
|
|
|
|
|
return nil, err
|
|
|
|
|
}
|
2016-12-31 17:32:31 +01:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return e, nil
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// parseLsListLine parses a directory line in a format based on the output of
|
|
|
|
|
// the UNIX ls command.
|
2018-03-20 06:07:44 +01:00
|
|
|
|
func parseLsListLine(line string, now time.Time, loc *time.Location) (*Entry, error) {
|
2016-12-31 17:32:31 +01:00
|
|
|
|
|
2019-05-22 12:26:03 +02:00
|
|
|
|
// Has the first field a length of exactly 10 bytes
|
|
|
|
|
// - or 10 bytes with an additional '+' character for indicating ACLs?
|
|
|
|
|
// If not, return.
|
|
|
|
|
if i := strings.IndexByte(line, ' '); !(i == 10 || (i == 11 && line[10] == '+')) {
|
2016-12-31 17:32:31 +01:00
|
|
|
|
return nil, errUnsupportedListLine
|
|
|
|
|
}
|
|
|
|
|
|
2017-03-04 13:01:41 +01:00
|
|
|
|
scanner := newScanner(line)
|
2016-12-31 17:32:31 +01:00
|
|
|
|
fields := scanner.NextFields(6)
|
|
|
|
|
|
|
|
|
|
if len(fields) < 6 {
|
|
|
|
|
return nil, errUnsupportedListLine
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if fields[1] == "folder" && fields[2] == "0" {
|
|
|
|
|
e := &Entry{
|
|
|
|
|
Type: EntryTypeFolder,
|
|
|
|
|
Name: scanner.Remaining(),
|
|
|
|
|
}
|
2018-03-20 06:07:44 +01:00
|
|
|
|
if err := e.setTime(fields[3:6], now, loc); err != nil {
|
2016-12-31 17:32:31 +01:00
|
|
|
|
return nil, err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return e, nil
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if fields[1] == "0" {
|
|
|
|
|
fields = append(fields, scanner.Next())
|
|
|
|
|
e := &Entry{
|
|
|
|
|
Type: EntryTypeFile,
|
|
|
|
|
Name: scanner.Remaining(),
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if err := e.setSize(fields[2]); err != nil {
|
2017-07-06 02:55:11 +02:00
|
|
|
|
return nil, errUnsupportedListLine
|
2016-12-31 17:32:31 +01:00
|
|
|
|
}
|
2018-03-20 06:07:44 +01:00
|
|
|
|
if err := e.setTime(fields[4:7], now, loc); err != nil {
|
2016-12-31 17:32:31 +01:00
|
|
|
|
return nil, err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return e, nil
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// Read two more fields
|
|
|
|
|
fields = append(fields, scanner.NextFields(2)...)
|
|
|
|
|
if len(fields) < 8 {
|
|
|
|
|
return nil, errUnsupportedListLine
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
e := &Entry{
|
|
|
|
|
Name: scanner.Remaining(),
|
|
|
|
|
}
|
|
|
|
|
switch fields[0][0] {
|
|
|
|
|
case '-':
|
|
|
|
|
e.Type = EntryTypeFile
|
|
|
|
|
if err := e.setSize(fields[4]); err != nil {
|
|
|
|
|
return nil, err
|
|
|
|
|
}
|
|
|
|
|
case 'd':
|
|
|
|
|
e.Type = EntryTypeFolder
|
|
|
|
|
case 'l':
|
|
|
|
|
e.Type = EntryTypeLink
|
2019-06-24 10:49:00 +02:00
|
|
|
|
|
|
|
|
|
// Split link name and target
|
|
|
|
|
if i := strings.Index(e.Name, " -> "); i > 0 {
|
|
|
|
|
e.Target = e.Name[i+4:]
|
|
|
|
|
e.Name = e.Name[:i]
|
|
|
|
|
}
|
2016-12-31 17:32:31 +01:00
|
|
|
|
default:
|
2019-01-22 16:04:06 +01:00
|
|
|
|
return nil, errUnknownListEntryType
|
2016-12-31 17:32:31 +01:00
|
|
|
|
}
|
|
|
|
|
|
2018-03-20 06:07:44 +01:00
|
|
|
|
if err := e.setTime(fields[5:8], now, loc); err != nil {
|
2016-12-31 17:32:31 +01:00
|
|
|
|
return nil, err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return e, nil
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// parseDirListLine parses a directory line in a format based on the output of
|
|
|
|
|
// the MS-DOS DIR command.
|
2023-06-29 18:58:13 +02:00
|
|
|
|
func parseDirListLine(line string, _ time.Time, loc *time.Location) (*Entry, error) {
|
2016-12-31 17:32:31 +01:00
|
|
|
|
e := &Entry{}
|
|
|
|
|
var err error
|
|
|
|
|
|
|
|
|
|
// Try various time formats that DIR might use, and stop when one works.
|
|
|
|
|
for _, format := range dirTimeFormats {
|
|
|
|
|
if len(line) > len(format) {
|
2018-03-20 06:07:44 +01:00
|
|
|
|
e.Time, err = time.ParseInLocation(format, line[:len(format)], loc)
|
2016-12-31 17:32:31 +01:00
|
|
|
|
if err == nil {
|
|
|
|
|
line = line[len(format):]
|
|
|
|
|
break
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
if err != nil {
|
|
|
|
|
// None of the time formats worked.
|
|
|
|
|
return nil, errUnsupportedListLine
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
line = strings.TrimLeft(line, " ")
|
|
|
|
|
if strings.HasPrefix(line, "<DIR>") {
|
|
|
|
|
e.Type = EntryTypeFolder
|
|
|
|
|
line = strings.TrimPrefix(line, "<DIR>")
|
|
|
|
|
} else {
|
|
|
|
|
space := strings.Index(line, " ")
|
|
|
|
|
if space == -1 {
|
|
|
|
|
return nil, errUnsupportedListLine
|
|
|
|
|
}
|
|
|
|
|
e.Size, err = strconv.ParseUint(line[:space], 10, 64)
|
|
|
|
|
if err != nil {
|
|
|
|
|
return nil, errUnsupportedListLine
|
|
|
|
|
}
|
|
|
|
|
e.Type = EntryTypeFile
|
|
|
|
|
line = line[space:]
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
e.Name = strings.TrimLeft(line, " ")
|
|
|
|
|
return e, nil
|
|
|
|
|
}
|
|
|
|
|
|
2017-07-06 02:55:11 +02:00
|
|
|
|
// parseHostedFTPLine parses a directory line in the non-standard format used
|
|
|
|
|
// by hostedftp.com
|
|
|
|
|
// -r-------- 0 user group 65222236 Feb 24 00:39 UABlacklistingWeek8.csv
|
|
|
|
|
// (The link count is inexplicably 0)
|
2018-03-20 06:07:44 +01:00
|
|
|
|
func parseHostedFTPLine(line string, now time.Time, loc *time.Location) (*Entry, error) {
|
2017-07-06 02:55:11 +02:00
|
|
|
|
// Has the first field a length of 10 bytes?
|
|
|
|
|
if strings.IndexByte(line, ' ') != 10 {
|
|
|
|
|
return nil, errUnsupportedListLine
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
scanner := newScanner(line)
|
2017-07-20 21:09:00 +02:00
|
|
|
|
fields := scanner.NextFields(2)
|
|
|
|
|
|
|
|
|
|
if len(fields) < 2 || fields[1] != "0" {
|
|
|
|
|
return nil, errUnsupportedListLine
|
2017-07-06 02:55:11 +02:00
|
|
|
|
}
|
|
|
|
|
|
2017-07-20 21:09:00 +02:00
|
|
|
|
// Set link count to 1 and attempt to parse as Unix.
|
2018-03-20 06:07:44 +01:00
|
|
|
|
return parseLsListLine(fields[0]+" 1 "+scanner.Remaining(), now, loc)
|
2017-07-06 02:55:11 +02:00
|
|
|
|
}
|
|
|
|
|
|
2016-12-31 17:32:31 +01:00
|
|
|
|
// parseListLine parses the various non-standard format returned by the LIST
|
|
|
|
|
// FTP command.
|
2018-03-20 06:07:44 +01:00
|
|
|
|
func parseListLine(line string, now time.Time, loc *time.Location) (*Entry, error) {
|
2016-12-31 17:32:31 +01:00
|
|
|
|
for _, f := range listLineParsers {
|
2018-03-20 06:07:44 +01:00
|
|
|
|
e, err := f(line, now, loc)
|
2016-12-31 17:32:31 +01:00
|
|
|
|
if err != errUnsupportedListLine {
|
|
|
|
|
return e, err
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return nil, errUnsupportedListLine
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
func (e *Entry) setSize(str string) (err error) {
|
|
|
|
|
e.Size, err = strconv.ParseUint(str, 0, 64)
|
|
|
|
|
return
|
|
|
|
|
}
|
|
|
|
|
|
2018-03-20 06:07:44 +01:00
|
|
|
|
func (e *Entry) setTime(fields []string, now time.Time, loc *time.Location) (err error) {
|
2018-01-04 13:03:09 +01:00
|
|
|
|
if strings.Contains(fields[2], ":") { // contains time
|
|
|
|
|
thisYear, _, _ := now.Date()
|
2018-03-20 06:07:44 +01:00
|
|
|
|
timeStr := fmt.Sprintf("%s %s %d %s", fields[1], fields[0], thisYear, fields[2])
|
|
|
|
|
e.Time, err = time.ParseInLocation("_2 Jan 2006 15:04", timeStr, loc)
|
2018-01-04 13:03:09 +01:00
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
On unix, `info ls` shows:
|
|
|
|
|
|
|
|
|
|
10.1.6 Formatting file timestamps
|
|
|
|
|
---------------------------------
|
|
|
|
|
|
|
|
|
|
A timestamp is considered to be “recent” if it is less than six
|
|
|
|
|
months old, and is not dated in the future. If a timestamp dated today
|
|
|
|
|
is not listed in recent form, the timestamp is in the future, which
|
|
|
|
|
means you probably have clock skew problems which may break programs
|
|
|
|
|
like ‘make’ that rely on file timestamps.
|
|
|
|
|
*/
|
|
|
|
|
if !e.Time.Before(now.AddDate(0, 6, 0)) {
|
|
|
|
|
e.Time = e.Time.AddDate(-1, 0, 0)
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
} else { // only the date
|
2016-12-31 17:32:31 +01:00
|
|
|
|
if len(fields[2]) != 4 {
|
2019-01-22 16:04:06 +01:00
|
|
|
|
return errUnsupportedListDate
|
2016-12-31 17:32:31 +01:00
|
|
|
|
}
|
2018-03-20 06:07:44 +01:00
|
|
|
|
timeStr := fmt.Sprintf("%s %s %s 00:00", fields[1], fields[0], fields[2])
|
|
|
|
|
e.Time, err = time.ParseInLocation("_2 Jan 2006 15:04", timeStr, loc)
|
2016-12-31 17:32:31 +01:00
|
|
|
|
}
|
|
|
|
|
return
|
|
|
|
|
}
|