parse.go 5.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235
  1. package ftp
  2. import (
  3. "errors"
  4. "strconv"
  5. "strings"
  6. "time"
  7. )
  8. var errUnsupportedListLine = errors.New("Unsupported LIST line")
  9. var listLineParsers = []func(line string) (*Entry, error){
  10. parseRFC3659ListLine,
  11. parseLsListLine,
  12. parseDirListLine,
  13. parseHostedFTPLine,
  14. }
  15. var dirTimeFormats = []string{
  16. "01-02-06 03:04PM",
  17. "2006-01-02 15:04",
  18. }
  19. // parseRFC3659ListLine parses the style of directory line defined in RFC 3659.
  20. func parseRFC3659ListLine(line string) (*Entry, error) {
  21. iSemicolon := strings.Index(line, ";")
  22. iWhitespace := strings.Index(line, " ")
  23. if iSemicolon < 0 || iSemicolon > iWhitespace {
  24. return nil, errUnsupportedListLine
  25. }
  26. e := &Entry{
  27. Name: line[iWhitespace+1:],
  28. }
  29. for _, field := range strings.Split(line[:iWhitespace-1], ";") {
  30. i := strings.Index(field, "=")
  31. if i < 1 {
  32. return nil, errUnsupportedListLine
  33. }
  34. key := strings.ToLower(field[:i])
  35. value := field[i+1:]
  36. switch key {
  37. case "modify":
  38. var err error
  39. e.Time, err = time.Parse("20060102150405", value)
  40. if err != nil {
  41. return nil, err
  42. }
  43. case "type":
  44. switch value {
  45. case "dir", "cdir", "pdir":
  46. e.Type = EntryTypeFolder
  47. case "file":
  48. e.Type = EntryTypeFile
  49. }
  50. case "size":
  51. e.setSize(value)
  52. }
  53. }
  54. return e, nil
  55. }
  56. // parseLsListLine parses a directory line in a format based on the output of
  57. // the UNIX ls command.
  58. func parseLsListLine(line string) (*Entry, error) {
  59. // Has the first field a length of 10 bytes?
  60. if strings.IndexByte(line, ' ') != 10 {
  61. return nil, errUnsupportedListLine
  62. }
  63. scanner := newScanner(line)
  64. fields := scanner.NextFields(6)
  65. if len(fields) < 6 {
  66. return nil, errUnsupportedListLine
  67. }
  68. if fields[1] == "folder" && fields[2] == "0" {
  69. e := &Entry{
  70. Type: EntryTypeFolder,
  71. Name: scanner.Remaining(),
  72. }
  73. if err := e.setTime(fields[3:6]); err != nil {
  74. return nil, err
  75. }
  76. return e, nil
  77. }
  78. if fields[1] == "0" {
  79. fields = append(fields, scanner.Next())
  80. e := &Entry{
  81. Type: EntryTypeFile,
  82. Name: scanner.Remaining(),
  83. }
  84. if err := e.setSize(fields[2]); err != nil {
  85. return nil, errUnsupportedListLine
  86. }
  87. if err := e.setTime(fields[4:7]); err != nil {
  88. return nil, err
  89. }
  90. return e, nil
  91. }
  92. // Read two more fields
  93. fields = append(fields, scanner.NextFields(2)...)
  94. if len(fields) < 8 {
  95. return nil, errUnsupportedListLine
  96. }
  97. e := &Entry{
  98. Name: scanner.Remaining(),
  99. }
  100. switch fields[0][0] {
  101. case '-':
  102. e.Type = EntryTypeFile
  103. if err := e.setSize(fields[4]); err != nil {
  104. return nil, err
  105. }
  106. case 'd':
  107. e.Type = EntryTypeFolder
  108. case 'l':
  109. e.Type = EntryTypeLink
  110. default:
  111. return nil, errors.New("Unknown entry type")
  112. }
  113. if err := e.setTime(fields[5:8]); err != nil {
  114. return nil, err
  115. }
  116. return e, nil
  117. }
  118. // parseDirListLine parses a directory line in a format based on the output of
  119. // the MS-DOS DIR command.
  120. func parseDirListLine(line string) (*Entry, error) {
  121. e := &Entry{}
  122. var err error
  123. // Try various time formats that DIR might use, and stop when one works.
  124. for _, format := range dirTimeFormats {
  125. if len(line) > len(format) {
  126. e.Time, err = time.Parse(format, line[:len(format)])
  127. if err == nil {
  128. line = line[len(format):]
  129. break
  130. }
  131. }
  132. }
  133. if err != nil {
  134. // None of the time formats worked.
  135. return nil, errUnsupportedListLine
  136. }
  137. line = strings.TrimLeft(line, " ")
  138. if strings.HasPrefix(line, "<DIR>") {
  139. e.Type = EntryTypeFolder
  140. line = strings.TrimPrefix(line, "<DIR>")
  141. } else {
  142. space := strings.Index(line, " ")
  143. if space == -1 {
  144. return nil, errUnsupportedListLine
  145. }
  146. e.Size, err = strconv.ParseUint(line[:space], 10, 64)
  147. if err != nil {
  148. return nil, errUnsupportedListLine
  149. }
  150. e.Type = EntryTypeFile
  151. line = line[space:]
  152. }
  153. e.Name = strings.TrimLeft(line, " ")
  154. return e, nil
  155. }
  156. // parseHostedFTPLine parses a directory line in the non-standard format used
  157. // by hostedftp.com
  158. // -r-------- 0 user group 65222236 Feb 24 00:39 UABlacklistingWeek8.csv
  159. // (The link count is inexplicably 0)
  160. func parseHostedFTPLine(line string) (*Entry, error) {
  161. // Has the first field a length of 10 bytes?
  162. if strings.IndexByte(line, ' ') != 10 {
  163. return nil, errUnsupportedListLine
  164. }
  165. scanner := newScanner(line)
  166. fields := scanner.NextFields(2)
  167. if len(fields) < 2 || fields[1] != "0" {
  168. return nil, errUnsupportedListLine
  169. }
  170. // Set link count to 1 and attempt to parse as Unix.
  171. return parseLsListLine(fields[0] + " 1 " + scanner.Remaining())
  172. }
  173. // parseListLine parses the various non-standard format returned by the LIST
  174. // FTP command.
  175. func parseListLine(line string) (*Entry, error) {
  176. for _, f := range listLineParsers {
  177. e, err := f(line)
  178. if err != errUnsupportedListLine {
  179. return e, err
  180. }
  181. }
  182. return nil, errUnsupportedListLine
  183. }
  184. func (e *Entry) setSize(str string) (err error) {
  185. e.Size, err = strconv.ParseUint(str, 0, 64)
  186. return
  187. }
  188. func (e *Entry) setTime(fields []string) (err error) {
  189. var timeStr string
  190. if strings.Contains(fields[2], ":") { // this year
  191. thisYear, _, _ := time.Now().Date()
  192. timeStr = fields[1] + " " + fields[0] + " " + strconv.Itoa(thisYear)[2:4] + " " + fields[2] + " GMT"
  193. } else { // not this year
  194. if len(fields[2]) != 4 {
  195. return errors.New("Invalid year format in time string")
  196. }
  197. timeStr = fields[1] + " " + fields[0] + " " + fields[2][2:4] + " 00:00 GMT"
  198. }
  199. e.Time, err = time.Parse("_2 Jan 06 15:04 MST", timeStr)
  200. return
  201. }