OLD | NEW |
1 // Copyright (c) 2009 The Chromium Authors. All rights reserved. Use of this | 1 // Copyright (c) 2009 The Chromium Authors. All rights reserved. Use of this |
2 // source code is governed by a BSD-style license that can be found in the | 2 // source code is governed by a BSD-style license that can be found in the |
3 // LICENSE file. | 3 // LICENSE file. |
4 | 4 |
5 #include "net/ftp/ftp_directory_listing_parsers.h" | 5 #include "net/ftp/ftp_directory_listing_parsers.h" |
6 | 6 |
7 #include "base/string_util.h" | 7 #include "base/string_util.h" |
8 | 8 |
9 namespace { | 9 namespace { |
10 | 10 |
11 bool LooksLikeUnixPermission(const string16& text) { | 11 bool LooksLikeUnixPermission(const string16& text) { |
12 if (text.length() != 3) | 12 if (text.length() != 3) |
13 return false; | 13 return false; |
14 | 14 |
15 return ((text[0] == 'r' || text[0] == '-') && | 15 return ((text[0] == 'r' || text[0] == '-') && |
16 (text[1] == 'w' || text[1] == '-') && | 16 (text[1] == 'w' || text[1] == '-') && |
17 (text[2] == 'x' || text[2] == 's' || text[2] == 'S' || | 17 (text[2] == 'x' || text[2] == 's' || text[2] == 'S' || |
18 text[2] == '-')); | 18 text[2] == '-')); |
19 } | 19 } |
20 | 20 |
21 bool LooksLikeUnixPermissionsListing(const string16& text) { | 21 bool LooksLikeUnixPermissionsListing(const string16& text) { |
22 if (text.length() != 10) | 22 if (text.length() != 10) |
23 return false; | 23 return false; |
24 | 24 |
25 if (text[0] != 'b' && text[0] != 'c' && text[0] != 'd' && | 25 if (text[0] != 'b' && text[0] != 'c' && text[0] != 'd' && |
26 text[0] != 'l' && text[0] != 'p' && text[0] != 's' && | 26 text[0] != 'l' && text[0] != 'p' && text[0] != 's' && |
27 text[0] != '-') | 27 text[0] != '-') |
28 return false; | 28 return false; |
29 | 29 |
30 return (LooksLikeUnixPermission(text.substr(1, 3)) && | 30 return (LooksLikeUnixPermission(text.substr(1, 3)) && |
31 LooksLikeUnixPermission(text.substr(4, 3)) && | 31 LooksLikeUnixPermission(text.substr(4, 3)) && |
32 LooksLikeUnixPermission(text.substr(7, 3))); | 32 LooksLikeUnixPermission(text.substr(7, 3))); |
33 } | 33 } |
34 | 34 |
35 bool IsStringNonNegativeNumber(const string16& text) { | 35 bool IsStringNonNegativeInteger(const string16& text) { |
36 int number; | 36 int number; |
37 if (!StringToInt(text, &number)) | 37 if (!StringToInt(text, &number)) |
38 return false; | 38 return false; |
39 | 39 |
40 return number >= 0; | 40 return number >= 0; |
41 } | 41 } |
42 | 42 |
43 bool ThreeLetterMonthToNumber(const string16& text, int* number) { | 43 bool ThreeLetterMonthToNumber(const string16& text, int* number) { |
44 const static char* months[] = { "jan", "feb", "mar", "apr", "may", "jun", | 44 const static char* months[] = { "jan", "feb", "mar", "apr", "may", "jun", |
45 "jul", "aug", "sep", "oct", "nov", "dec" }; | 45 "jul", "aug", "sep", "oct", "nov", "dec" }; |
46 | 46 |
47 for (size_t i = 0; i < arraysize(months); i++) { | 47 for (size_t i = 0; i < arraysize(months); i++) { |
48 if (LowerCaseEqualsASCII(text, months[i])) { | 48 if (LowerCaseEqualsASCII(text, months[i])) { |
49 *number = i + 1; | 49 *number = i + 1; |
50 return true; | 50 return true; |
51 } | 51 } |
52 } | 52 } |
53 | 53 |
54 return false; | 54 return false; |
55 } | 55 } |
56 | 56 |
57 bool UnixDateListingToTime(const std::vector<string16>& columns, | 57 bool UnixDateListingToTime(const std::vector<string16>& columns, |
58 base::Time* time) { | 58 base::Time* time) { |
59 DCHECK_EQ(9U, columns.size()); | 59 DCHECK_EQ(9U, columns.size()); |
60 | 60 |
61 base::Time::Exploded time_exploded = { 0 }; | 61 base::Time::Exploded time_exploded = { 0 }; |
62 | 62 |
63 if (!ThreeLetterMonthToNumber(columns[5], &time_exploded.month)) | 63 if (!ThreeLetterMonthToNumber(columns[5], &time_exploded.month)) |
64 return false; | 64 return false; |
65 | 65 |
66 if (!StringToInt(columns[6], &time_exploded.day_of_month)) | 66 if (!StringToInt(columns[6], &time_exploded.day_of_month)) |
67 return false; | 67 return false; |
68 | 68 |
69 if (!StringToInt(columns[7], &time_exploded.year)) { | 69 if (!StringToInt(columns[7], &time_exploded.year)) { |
70 // Maybe it's time. Does it look like time (MM:HH)? | 70 // Maybe it's time. Does it look like time (MM:HH)? |
71 if (columns[7].length() != 5 || columns[7][2] != ':') | 71 if (columns[7].length() != 5 || columns[7][2] != ':') |
72 return false; | 72 return false; |
73 | 73 |
74 if (!StringToInt(columns[7].substr(0, 2), &time_exploded.hour)) | 74 if (!StringToInt(columns[7].substr(0, 2), &time_exploded.hour)) |
75 return false; | 75 return false; |
76 | 76 |
77 if (!StringToInt(columns[7].substr(3, 2), &time_exploded.minute)) | 77 if (!StringToInt(columns[7].substr(3, 2), &time_exploded.minute)) |
78 return false; | 78 return false; |
79 | 79 |
80 // Use current year. | 80 // Use current year. |
81 base::Time::Exploded now_exploded; | 81 base::Time::Exploded now_exploded; |
82 base::Time::Now().LocalExplode(&now_exploded); | 82 base::Time::Now().LocalExplode(&now_exploded); |
83 time_exploded.year = now_exploded.year; | 83 time_exploded.year = now_exploded.year; |
84 } | 84 } |
85 | 85 |
86 // We don't know the time zone of the server, so just use local time. | 86 // We don't know the time zone of the server, so just use local time. |
87 *time = base::Time::FromLocalExploded(time_exploded); | 87 *time = base::Time::FromLocalExploded(time_exploded); |
88 return true; | 88 return true; |
89 } | 89 } |
90 | 90 |
| 91 // Converts the filename component in listing to the filename we can display. |
| 92 // Returns true on success. |
| 93 bool ParseVmsFilename(const string16& raw_filename, string16* parsed_filename, |
| 94 bool* is_directory) { |
| 95 // On VMS, the files and directories are versioned. The version number is |
| 96 // separated from the file name by a semicolon. Example: ANNOUNCE.TXT;2. |
| 97 std::vector<string16> listing_parts; |
| 98 SplitString(raw_filename, ';', &listing_parts); |
| 99 if (listing_parts.size() != 2) |
| 100 return false; |
| 101 if (!IsStringNonNegativeInteger(listing_parts[1])) |
| 102 return false; |
| 103 |
| 104 // Even directories have extensions in the listings. Don't display extensions |
| 105 // for directories; it's awkward for non-VMS users. Also, VMS is |
| 106 // case-insensitive, but generally uses uppercase characters. This may look |
| 107 // awkward, so we convert them to lower case. |
| 108 std::vector<string16> filename_parts; |
| 109 SplitString(listing_parts[0], '.', &filename_parts); |
| 110 if (filename_parts.size() != 2) |
| 111 return false; |
| 112 if (filename_parts[1] == ASCIIToUTF16("DIR")) { |
| 113 *parsed_filename = StringToLowerASCII(filename_parts[0]); |
| 114 *is_directory = true; |
| 115 } else { |
| 116 *parsed_filename = StringToLowerASCII(listing_parts[0]); |
| 117 *is_directory = false; |
| 118 } |
| 119 return true; |
| 120 } |
| 121 |
| 122 bool ParseVmsFilesize(const string16& input, int64* size) { |
| 123 // VMS's directory listing gives us file size in blocks. We assume that |
| 124 // the block size is 512 bytes. It doesn't give accurate file size, but is the |
| 125 // best information we have. |
| 126 const int kBlockSize = 512; |
| 127 |
| 128 if (StringToInt64(input, size)) { |
| 129 *size *= kBlockSize; |
| 130 return true; |
| 131 } |
| 132 |
| 133 std::vector<string16> parts; |
| 134 SplitString(input, '/', &parts); |
| 135 if (parts.size() != 2) |
| 136 return false; |
| 137 |
| 138 int64 blocks_used, blocks_allocated; |
| 139 if (!StringToInt64(parts[0], &blocks_used)) |
| 140 return false; |
| 141 if (!StringToInt64(parts[1], &blocks_allocated)) |
| 142 return false; |
| 143 if (blocks_used > blocks_allocated) |
| 144 return false; |
| 145 |
| 146 *size = blocks_used * kBlockSize; |
| 147 return true; |
| 148 } |
| 149 |
| 150 bool LooksLikeVmsFileProtectionListingPart(const string16& input) { |
| 151 if (input.length() > 4) |
| 152 return false; |
| 153 |
| 154 // On VMS there are four different permission bits: Read, Write, Execute, |
| 155 // and Delete. They appear in that order in the permission listing. |
| 156 std::string pattern("RWED"); |
| 157 string16 match(input); |
| 158 while (!match.empty() && !pattern.empty()) { |
| 159 if (match[0] == pattern[0]) |
| 160 match = match.substr(1); |
| 161 pattern = pattern.substr(1); |
| 162 } |
| 163 return match.empty(); |
| 164 } |
| 165 |
| 166 bool LooksLikeVmsFileProtectionListing(const string16& input) { |
| 167 if (input.length() < 2) |
| 168 return false; |
| 169 if (input[0] != '(' || input[input.length() - 1] != ')') |
| 170 return false; |
| 171 |
| 172 // We expect four parts of the file protection listing: for System, Owner, |
| 173 // Group, and World. |
| 174 std::vector<string16> parts; |
| 175 SplitString(input.substr(1, input.length() - 2), ',', &parts); |
| 176 if (parts.size() != 4) |
| 177 return false; |
| 178 |
| 179 return LooksLikeVmsFileProtectionListingPart(parts[0]) && |
| 180 LooksLikeVmsFileProtectionListingPart(parts[1]) && |
| 181 LooksLikeVmsFileProtectionListingPart(parts[2]) && |
| 182 LooksLikeVmsFileProtectionListingPart(parts[3]); |
| 183 } |
| 184 |
| 185 bool LooksLikeVmsUserIdentificationCode(const string16& input) { |
| 186 if (input.length() < 2) |
| 187 return false; |
| 188 return input[0] == '[' && input[input.length() - 1] == ']'; |
| 189 } |
| 190 |
| 191 bool VmsDateListingToTime(const std::vector<string16>& columns, |
| 192 base::Time* time) { |
| 193 DCHECK_EQ(3U, columns.size()); |
| 194 |
| 195 base::Time::Exploded time_exploded = { 0 }; |
| 196 |
| 197 // Date should be in format DD-MMM-YYYY. |
| 198 std::vector<string16> date_parts; |
| 199 SplitString(columns[1], '-', &date_parts); |
| 200 if (date_parts.size() != 3) |
| 201 return false; |
| 202 if (!StringToInt(date_parts[0], &time_exploded.day_of_month)) |
| 203 return false; |
| 204 if (!ThreeLetterMonthToNumber(date_parts[1], &time_exploded.month)) |
| 205 return false; |
| 206 if (!StringToInt(date_parts[2], &time_exploded.year)) |
| 207 return false; |
| 208 |
| 209 // Time can be in format HH:MM, HH:MM:SS, or HH:MM:SS.mm. Try to recognize the |
| 210 // last type first. Do not parse the seconds, they will be ignored anyway. |
| 211 string16 time_column(columns[2]); |
| 212 if (time_column.length() == 11 && time_column[8] == '.') |
| 213 time_column = time_column.substr(0, 8); |
| 214 if (time_column.length() == 8 && time_column[5] == ':') |
| 215 time_column = time_column.substr(0, 5); |
| 216 if (time_column.length() != 5) |
| 217 return false; |
| 218 std::vector<string16> time_parts; |
| 219 SplitString(time_column, ':', &time_parts); |
| 220 if (time_parts.size() != 2) |
| 221 return false; |
| 222 if (!StringToInt(time_parts[0], &time_exploded.hour)) |
| 223 return false; |
| 224 if (!StringToInt(time_parts[1], &time_exploded.minute)) |
| 225 return false; |
| 226 |
| 227 // We don't know the time zone of the server, so just use local time. |
| 228 *time = base::Time::FromLocalExploded(time_exploded); |
| 229 return true; |
| 230 } |
| 231 |
91 } // namespace | 232 } // namespace |
92 | 233 |
93 namespace net { | 234 namespace net { |
94 | 235 |
95 FtpDirectoryListingParser::~FtpDirectoryListingParser() { | 236 FtpDirectoryListingParser::~FtpDirectoryListingParser() { |
96 } | 237 } |
97 | 238 |
98 FtpLsDirectoryListingParser::FtpLsDirectoryListingParser() { | 239 FtpLsDirectoryListingParser::FtpLsDirectoryListingParser() { |
99 } | 240 } |
100 | 241 |
101 bool FtpLsDirectoryListingParser::ConsumeLine(const string16& line) { | 242 bool FtpLsDirectoryListingParser::ConsumeLine(const string16& line) { |
102 std::vector<string16> columns; | 243 std::vector<string16> columns; |
103 SplitString(CollapseWhitespace(line, false), ' ', &columns); | 244 SplitString(CollapseWhitespace(line, false), ' ', &columns); |
104 if (columns.size() == 11) { | 245 if (columns.size() == 11) { |
105 // Check if it is a symlink. | 246 // Check if it is a symlink. |
106 if (columns[9] != ASCIIToUTF16("->")) | 247 if (columns[9] != ASCIIToUTF16("->")) |
107 return false; | 248 return false; |
108 | 249 |
109 // Drop the symlink target from columns, we don't use it. | 250 // Drop the symlink target from columns, we don't use it. |
110 columns.resize(9); | 251 columns.resize(9); |
111 } | 252 } |
112 | 253 |
113 if (columns.size() != 9) | 254 if (columns.size() != 9) |
114 return false; | 255 return false; |
115 | 256 |
116 if (!LooksLikeUnixPermissionsListing(columns[0])) | 257 if (!LooksLikeUnixPermissionsListing(columns[0])) |
117 return false; | 258 return false; |
118 | 259 |
119 FtpDirectoryListingEntry entry; | 260 FtpDirectoryListingEntry entry; |
120 if (columns[0][0] == 'l') { | 261 if (columns[0][0] == 'l') { |
121 entry.type = FtpDirectoryListingEntry::SYMLINK; | 262 entry.type = FtpDirectoryListingEntry::SYMLINK; |
122 } else if (columns[0][0] == 'd') { | 263 } else if (columns[0][0] == 'd') { |
123 entry.type = FtpDirectoryListingEntry::DIRECTORY; | 264 entry.type = FtpDirectoryListingEntry::DIRECTORY; |
124 } else { | 265 } else { |
125 entry.type = FtpDirectoryListingEntry::FILE; | 266 entry.type = FtpDirectoryListingEntry::FILE; |
126 } | 267 } |
127 | 268 |
128 if (!IsStringNonNegativeNumber(columns[1])) | 269 if (!IsStringNonNegativeInteger(columns[1])) |
129 return false; | 270 return false; |
130 | 271 |
131 if (!StringToInt64(columns[4], &entry.size)) | 272 if (!StringToInt64(columns[4], &entry.size)) |
132 return false; | 273 return false; |
133 if (entry.size < 0) | 274 if (entry.size < 0) |
134 return false; | 275 return false; |
135 if (entry.type != FtpDirectoryListingEntry::FILE) | 276 if (entry.type != FtpDirectoryListingEntry::FILE) |
136 entry.size = -1; | 277 entry.size = -1; |
137 | 278 |
138 if (!UnixDateListingToTime(columns, &entry.last_modified)) | 279 if (!UnixDateListingToTime(columns, &entry.last_modified)) |
139 return false; | 280 return false; |
140 | 281 |
141 entry.name = columns[8]; | 282 entry.name = columns[8]; |
142 | 283 |
143 entries_.push(entry); | 284 entries_.push(entry); |
144 return true; | 285 return true; |
145 } | 286 } |
146 | 287 |
147 bool FtpLsDirectoryListingParser::EntryAvailable() const { | 288 bool FtpLsDirectoryListingParser::EntryAvailable() const { |
148 return !entries_.empty(); | 289 return !entries_.empty(); |
149 } | 290 } |
150 | 291 |
151 FtpDirectoryListingEntry FtpLsDirectoryListingParser::PopEntry() { | 292 FtpDirectoryListingEntry FtpLsDirectoryListingParser::PopEntry() { |
152 FtpDirectoryListingEntry entry = entries_.front(); | 293 FtpDirectoryListingEntry entry = entries_.front(); |
153 entries_.pop(); | 294 entries_.pop(); |
154 return entry; | 295 return entry; |
155 } | 296 } |
156 | 297 |
| 298 FtpVmsDirectoryListingParser::FtpVmsDirectoryListingParser() |
| 299 : state_(STATE_INITIAL), |
| 300 last_is_directory_(false) { |
| 301 } |
| 302 |
| 303 bool FtpVmsDirectoryListingParser::ConsumeLine(const string16& line) { |
| 304 switch (state_) { |
| 305 case STATE_INITIAL: |
| 306 DCHECK(last_filename_.empty()); |
| 307 if (line.empty()) |
| 308 return true; |
| 309 if (StartsWith(line, ASCIIToUTF16("Total of "), true)) { |
| 310 state_ = STATE_END; |
| 311 return true; |
| 312 } |
| 313 // We assume that the first non-empty line is the listing header. It often |
| 314 // starts with "Directory ", but not always. |
| 315 state_ = STATE_RECEIVED_HEADER; |
| 316 return true; |
| 317 case STATE_RECEIVED_HEADER: |
| 318 DCHECK(last_filename_.empty()); |
| 319 if (line.empty()) |
| 320 return true; |
| 321 state_ = STATE_ENTRIES; |
| 322 return ConsumeEntryLine(line); |
| 323 case STATE_ENTRIES: |
| 324 if (line.empty()) { |
| 325 if (!last_filename_.empty()) |
| 326 return false; |
| 327 state_ = STATE_RECEIVED_LAST_ENTRY; |
| 328 return true; |
| 329 } |
| 330 return ConsumeEntryLine(line); |
| 331 case STATE_RECEIVED_LAST_ENTRY: |
| 332 DCHECK(last_filename_.empty()); |
| 333 if (line.empty()) |
| 334 return true; |
| 335 if (!StartsWith(line, ASCIIToUTF16("Total of "), true)) |
| 336 return false; |
| 337 state_ = STATE_END; |
| 338 return true; |
| 339 case STATE_END: |
| 340 DCHECK(last_filename_.empty()); |
| 341 return false; |
| 342 default: |
| 343 NOTREACHED(); |
| 344 return false; |
| 345 } |
| 346 } |
| 347 |
| 348 bool FtpVmsDirectoryListingParser::EntryAvailable() const { |
| 349 return !entries_.empty(); |
| 350 } |
| 351 |
| 352 FtpDirectoryListingEntry FtpVmsDirectoryListingParser::PopEntry() { |
| 353 FtpDirectoryListingEntry entry = entries_.front(); |
| 354 entries_.pop(); |
| 355 return entry; |
| 356 } |
| 357 |
| 358 bool FtpVmsDirectoryListingParser::ConsumeEntryLine(const string16& line) { |
| 359 std::vector<string16> columns; |
| 360 SplitString(CollapseWhitespace(line, false), ' ', &columns); |
| 361 |
| 362 if (columns.size() == 1) { |
| 363 if (!last_filename_.empty()) |
| 364 return false; |
| 365 return ParseVmsFilename(columns[0], &last_filename_, &last_is_directory_); |
| 366 } |
| 367 |
| 368 // Recognize listing entries which generate "access denied" message even when |
| 369 // trying to list them. We don't display them in the final listing. |
| 370 static const char* kAccessDeniedMessages[] = { |
| 371 "%RMS-E-PRV", |
| 372 "privilege", |
| 373 }; |
| 374 for (size_t i = 0; i < arraysize(kAccessDeniedMessages); i++) { |
| 375 if (line.find(ASCIIToUTF16(kAccessDeniedMessages[i])) != string16::npos) { |
| 376 last_filename_.clear(); |
| 377 last_is_directory_ = false; |
| 378 return true; |
| 379 } |
| 380 } |
| 381 |
| 382 string16 filename; |
| 383 bool is_directory = false; |
| 384 if (last_filename_.empty()) { |
| 385 if (!ParseVmsFilename(columns[0], &filename, &is_directory)) |
| 386 return false; |
| 387 columns.erase(columns.begin()); |
| 388 } else { |
| 389 filename = last_filename_; |
| 390 is_directory = last_is_directory_; |
| 391 last_filename_.clear(); |
| 392 last_is_directory_ = false; |
| 393 } |
| 394 |
| 395 if (columns.size() > 5) |
| 396 return false; |
| 397 |
| 398 if (columns.size() == 5) { |
| 399 if (!LooksLikeVmsFileProtectionListing(columns[4])) |
| 400 return false; |
| 401 if (!LooksLikeVmsUserIdentificationCode(columns[3])) |
| 402 return false; |
| 403 columns.resize(3); |
| 404 } |
| 405 |
| 406 if (columns.size() != 3) |
| 407 return false; |
| 408 |
| 409 FtpDirectoryListingEntry entry; |
| 410 entry.name = filename; |
| 411 entry.type = is_directory ? FtpDirectoryListingEntry::DIRECTORY |
| 412 : FtpDirectoryListingEntry::FILE; |
| 413 if (!ParseVmsFilesize(columns[0], &entry.size)) |
| 414 return false; |
| 415 if (entry.size < 0) |
| 416 return false; |
| 417 if (entry.type != FtpDirectoryListingEntry::FILE) |
| 418 entry.size = -1; |
| 419 if (!VmsDateListingToTime(columns, &entry.last_modified)) |
| 420 return false; |
| 421 |
| 422 entries_.push(entry); |
| 423 return true; |
| 424 } |
| 425 |
157 } // namespace net | 426 } // namespace net |
OLD | NEW |