Chromium Code Reviews

Side by Side Diff: net/ftp/ftp_directory_listing_parsers.cc

Issue 348036: Implement VMS FTP directory listing parser. (Closed)
Patch Set: fix Created 11 years, 1 month ago
Use n/p to move between diff chunks; N/P to move between comments.
Jump to:
View unified diff |
OLDNEW
1 // Copyright (c) 2009 The Chromium Authors. All rights reserved. Use of this 1 // Copyright (c) 2009 The Chromium Authors. All rights reserved. Use of this
2 // source code is governed by a BSD-style license that can be found in the 2 // source code is governed by a BSD-style license that can be found in the
3 // LICENSE file. 3 // LICENSE file.
4 4
5 #include "net/ftp/ftp_directory_listing_parsers.h" 5 #include "net/ftp/ftp_directory_listing_parsers.h"
6 6
7 #include "base/string_util.h" 7 #include "base/string_util.h"
8 8
9 namespace { 9 namespace {
10 10
11 bool LooksLikeUnixPermission(const string16& text) { 11 bool LooksLikeUnixPermission(const string16& text) {
12 if (text.length() != 3) 12 if (text.length() != 3)
13 return false; 13 return false;
14 14
15 return ((text[0] == 'r' || text[0] == '-') && 15 return ((text[0] == 'r' || text[0] == '-') &&
16 (text[1] == 'w' || text[1] == '-') && 16 (text[1] == 'w' || text[1] == '-') &&
17 (text[2] == 'x' || text[2] == 's' || text[2] == 'S' || 17 (text[2] == 'x' || text[2] == 's' || text[2] == 'S' ||
18 text[2] == '-')); 18 text[2] == '-'));
19 } 19 }
20 20
21 bool LooksLikeUnixPermissionsListing(const string16& text) { 21 bool LooksLikeUnixPermissionsListing(const string16& text) {
22 if (text.length() != 10) 22 if (text.length() != 10)
23 return false; 23 return false;
24 24
25 if (text[0] != 'b' && text[0] != 'c' && text[0] != 'd' && 25 if (text[0] != 'b' && text[0] != 'c' && text[0] != 'd' &&
26 text[0] != 'l' && text[0] != 'p' && text[0] != 's' && 26 text[0] != 'l' && text[0] != 'p' && text[0] != 's' &&
27 text[0] != '-') 27 text[0] != '-')
28 return false; 28 return false;
29 29
30 return (LooksLikeUnixPermission(text.substr(1, 3)) && 30 return (LooksLikeUnixPermission(text.substr(1, 3)) &&
31 LooksLikeUnixPermission(text.substr(4, 3)) && 31 LooksLikeUnixPermission(text.substr(4, 3)) &&
32 LooksLikeUnixPermission(text.substr(7, 3))); 32 LooksLikeUnixPermission(text.substr(7, 3)));
33 } 33 }
34 34
35 bool IsStringNonNegativeNumber(const string16& text) { 35 bool IsStringNonNegativeInteger(const string16& text) {
36 int number; 36 int number;
37 if (!StringToInt(text, &number)) 37 if (!StringToInt(text, &number))
38 return false; 38 return false;
39 39
40 return number >= 0; 40 return number >= 0;
41 } 41 }
42 42
43 bool ThreeLetterMonthToNumber(const string16& text, int* number) { 43 bool ThreeLetterMonthToNumber(const string16& text, int* number) {
44 const static char* months[] = { "jan", "feb", "mar", "apr", "may", "jun", 44 const static char* months[] = { "jan", "feb", "mar", "apr", "may", "jun",
45 "jul", "aug", "sep", "oct", "nov", "dec" }; 45 "jul", "aug", "sep", "oct", "nov", "dec" };
46 46
47 for (size_t i = 0; i < arraysize(months); i++) { 47 for (size_t i = 0; i < arraysize(months); i++) {
48 if (LowerCaseEqualsASCII(text, months[i])) { 48 if (LowerCaseEqualsASCII(text, months[i])) {
49 *number = i + 1; 49 *number = i + 1;
50 return true; 50 return true;
51 } 51 }
52 } 52 }
53 53
54 return false; 54 return false;
55 } 55 }
56 56
57 bool UnixDateListingToTime(const std::vector<string16>& columns, 57 bool UnixDateListingToTime(const std::vector<string16>& columns,
58 base::Time* time) { 58 base::Time* time) {
59 DCHECK_EQ(9U, columns.size()); 59 DCHECK_EQ(9U, columns.size());
60 60
61 base::Time::Exploded time_exploded = { 0 }; 61 base::Time::Exploded time_exploded = { 0 };
62 62
63 if (!ThreeLetterMonthToNumber(columns[5], &time_exploded.month)) 63 if (!ThreeLetterMonthToNumber(columns[5], &time_exploded.month))
64 return false; 64 return false;
65 65
66 if (!StringToInt(columns[6], &time_exploded.day_of_month)) 66 if (!StringToInt(columns[6], &time_exploded.day_of_month))
67 return false; 67 return false;
68 68
69 if (!StringToInt(columns[7], &time_exploded.year)) { 69 if (!StringToInt(columns[7], &time_exploded.year)) {
70 // Maybe it's time. Does it look like time (MM:HH)? 70 // Maybe it's time. Does it look like time (MM:HH)?
71 if (columns[7].length() != 5 || columns[7][2] != ':') 71 if (columns[7].length() != 5 || columns[7][2] != ':')
72 return false; 72 return false;
73 73
74 if (!StringToInt(columns[7].substr(0, 2), &time_exploded.hour)) 74 if (!StringToInt(columns[7].substr(0, 2), &time_exploded.hour))
75 return false; 75 return false;
76 76
77 if (!StringToInt(columns[7].substr(3, 2), &time_exploded.minute)) 77 if (!StringToInt(columns[7].substr(3, 2), &time_exploded.minute))
78 return false; 78 return false;
79 79
80 // Use current year. 80 // Use current year.
81 base::Time::Exploded now_exploded; 81 base::Time::Exploded now_exploded;
82 base::Time::Now().LocalExplode(&now_exploded); 82 base::Time::Now().LocalExplode(&now_exploded);
83 time_exploded.year = now_exploded.year; 83 time_exploded.year = now_exploded.year;
84 } 84 }
85 85
86 // We don't know the time zone of the server, so just use local time. 86 // We don't know the time zone of the server, so just use local time.
87 *time = base::Time::FromLocalExploded(time_exploded); 87 *time = base::Time::FromLocalExploded(time_exploded);
88 return true; 88 return true;
89 } 89 }
90 90
91 // Converts the filename component in listing to the filename we can display.
92 // Returns true on success.
93 bool ParseVmsFilename(const string16& raw_filename, string16* parsed_filename,
94 bool* is_directory) {
95 // On VMS, the files and directories are versioned. The version number is
96 // separated from the file name by a semicolon. Example: ANNOUNCE.TXT;2.
97 std::vector<string16> listing_parts;
98 SplitString(raw_filename, ';', &listing_parts);
99 if (listing_parts.size() != 2)
100 return false;
101 if (!IsStringNonNegativeInteger(listing_parts[1]))
102 return false;
103
104 // Even directories have extensions in the listings. Don't display extensions
105 // for directories; it's awkward for non-VMS users. Also, VMS is
106 // case-insensitive, but generally uses uppercase characters. This may look
107 // awkward, so we convert them to lower case.
108 std::vector<string16> filename_parts;
109 SplitString(listing_parts[0], '.', &filename_parts);
110 if (filename_parts.size() != 2)
111 return false;
112 if (filename_parts[1] == ASCIIToUTF16("DIR")) {
113 *parsed_filename = StringToLowerASCII(filename_parts[0]);
114 *is_directory = true;
115 } else {
116 *parsed_filename = StringToLowerASCII(listing_parts[0]);
117 *is_directory = false;
118 }
119 return true;
120 }
121
122 bool ParseVmsFilesize(const string16& input, int64* size) {
123 // VMS's directory listing gives us file size in blocks. We assume that
124 // the block size is 512 bytes. It doesn't give accurate file size, but is the
125 // best information we have.
126 const int kBlockSize = 512;
127
128 if (StringToInt64(input, size)) {
129 *size *= kBlockSize;
130 return true;
131 }
132
133 std::vector<string16> parts;
134 SplitString(input, '/', &parts);
135 if (parts.size() != 2)
136 return false;
137
138 int64 blocks_used, blocks_allocated;
139 if (!StringToInt64(parts[0], &blocks_used))
140 return false;
141 if (!StringToInt64(parts[1], &blocks_allocated))
142 return false;
143 if (blocks_used > blocks_allocated)
144 return false;
145
146 *size = blocks_used * kBlockSize;
147 return true;
148 }
149
150 bool LooksLikeVmsFileProtectionListingPart(const string16& input) {
151 if (input.length() > 4)
152 return false;
153
154 // On VMS there are four different permission bits: Read, Write, Execute,
155 // and Delete. They appear in that order in the permission listing.
156 std::string pattern("RWED");
157 string16 match(input);
158 while (!match.empty() && !pattern.empty()) {
159 if (match[0] == pattern[0])
160 match = match.substr(1);
161 pattern = pattern.substr(1);
162 }
163 return match.empty();
164 }
165
166 bool LooksLikeVmsFileProtectionListing(const string16& input) {
167 if (input.length() < 2)
168 return false;
169 if (input[0] != '(' || input[input.length() - 1] != ')')
170 return false;
171
172 // We expect four parts of the file protection listing: for System, Owner,
173 // Group, and World.
174 std::vector<string16> parts;
175 SplitString(input.substr(1, input.length() - 2), ',', &parts);
176 if (parts.size() != 4)
177 return false;
178
179 return LooksLikeVmsFileProtectionListingPart(parts[0]) &&
180 LooksLikeVmsFileProtectionListingPart(parts[1]) &&
181 LooksLikeVmsFileProtectionListingPart(parts[2]) &&
182 LooksLikeVmsFileProtectionListingPart(parts[3]);
183 }
184
185 bool LooksLikeVmsUserIdentificationCode(const string16& input) {
186 if (input.length() < 2)
187 return false;
188 return input[0] == '[' && input[input.length() - 1] == ']';
189 }
190
191 bool VmsDateListingToTime(const std::vector<string16>& columns,
192 base::Time* time) {
193 DCHECK_EQ(3U, columns.size());
194
195 base::Time::Exploded time_exploded = { 0 };
196
197 // Date should be in format DD-MMM-YYYY.
198 std::vector<string16> date_parts;
199 SplitString(columns[1], '-', &date_parts);
200 if (date_parts.size() != 3)
201 return false;
202 if (!StringToInt(date_parts[0], &time_exploded.day_of_month))
203 return false;
204 if (!ThreeLetterMonthToNumber(date_parts[1], &time_exploded.month))
205 return false;
206 if (!StringToInt(date_parts[2], &time_exploded.year))
207 return false;
208
209 // Time can be in format HH:MM, HH:MM:SS, or HH:MM:SS.mm. Try to recognize the
210 // last type first. Do not parse the seconds, they will be ignored anyway.
211 string16 time_column(columns[2]);
212 if (time_column.length() == 11 && time_column[8] == '.')
213 time_column = time_column.substr(0, 8);
214 if (time_column.length() == 8 && time_column[5] == ':')
215 time_column = time_column.substr(0, 5);
216 if (time_column.length() != 5)
217 return false;
218 std::vector<string16> time_parts;
219 SplitString(time_column, ':', &time_parts);
220 if (time_parts.size() != 2)
221 return false;
222 if (!StringToInt(time_parts[0], &time_exploded.hour))
223 return false;
224 if (!StringToInt(time_parts[1], &time_exploded.minute))
225 return false;
226
227 // We don't know the time zone of the server, so just use local time.
228 *time = base::Time::FromLocalExploded(time_exploded);
229 return true;
230 }
231
91 } // namespace 232 } // namespace
92 233
93 namespace net { 234 namespace net {
94 235
95 FtpDirectoryListingParser::~FtpDirectoryListingParser() { 236 FtpDirectoryListingParser::~FtpDirectoryListingParser() {
96 } 237 }
97 238
98 FtpLsDirectoryListingParser::FtpLsDirectoryListingParser() { 239 FtpLsDirectoryListingParser::FtpLsDirectoryListingParser() {
99 } 240 }
100 241
101 bool FtpLsDirectoryListingParser::ConsumeLine(const string16& line) { 242 bool FtpLsDirectoryListingParser::ConsumeLine(const string16& line) {
102 std::vector<string16> columns; 243 std::vector<string16> columns;
103 SplitString(CollapseWhitespace(line, false), ' ', &columns); 244 SplitString(CollapseWhitespace(line, false), ' ', &columns);
104 if (columns.size() == 11) { 245 if (columns.size() == 11) {
105 // Check if it is a symlink. 246 // Check if it is a symlink.
106 if (columns[9] != ASCIIToUTF16("->")) 247 if (columns[9] != ASCIIToUTF16("->"))
107 return false; 248 return false;
108 249
109 // Drop the symlink target from columns, we don't use it. 250 // Drop the symlink target from columns, we don't use it.
110 columns.resize(9); 251 columns.resize(9);
111 } 252 }
112 253
113 if (columns.size() != 9) 254 if (columns.size() != 9)
114 return false; 255 return false;
115 256
116 if (!LooksLikeUnixPermissionsListing(columns[0])) 257 if (!LooksLikeUnixPermissionsListing(columns[0]))
117 return false; 258 return false;
118 259
119 FtpDirectoryListingEntry entry; 260 FtpDirectoryListingEntry entry;
120 if (columns[0][0] == 'l') { 261 if (columns[0][0] == 'l') {
121 entry.type = FtpDirectoryListingEntry::SYMLINK; 262 entry.type = FtpDirectoryListingEntry::SYMLINK;
122 } else if (columns[0][0] == 'd') { 263 } else if (columns[0][0] == 'd') {
123 entry.type = FtpDirectoryListingEntry::DIRECTORY; 264 entry.type = FtpDirectoryListingEntry::DIRECTORY;
124 } else { 265 } else {
125 entry.type = FtpDirectoryListingEntry::FILE; 266 entry.type = FtpDirectoryListingEntry::FILE;
126 } 267 }
127 268
128 if (!IsStringNonNegativeNumber(columns[1])) 269 if (!IsStringNonNegativeInteger(columns[1]))
129 return false; 270 return false;
130 271
131 if (!StringToInt64(columns[4], &entry.size)) 272 if (!StringToInt64(columns[4], &entry.size))
132 return false; 273 return false;
133 if (entry.size < 0) 274 if (entry.size < 0)
134 return false; 275 return false;
135 if (entry.type != FtpDirectoryListingEntry::FILE) 276 if (entry.type != FtpDirectoryListingEntry::FILE)
136 entry.size = -1; 277 entry.size = -1;
137 278
138 if (!UnixDateListingToTime(columns, &entry.last_modified)) 279 if (!UnixDateListingToTime(columns, &entry.last_modified))
139 return false; 280 return false;
140 281
141 entry.name = columns[8]; 282 entry.name = columns[8];
142 283
143 entries_.push(entry); 284 entries_.push(entry);
144 return true; 285 return true;
145 } 286 }
146 287
147 bool FtpLsDirectoryListingParser::EntryAvailable() const { 288 bool FtpLsDirectoryListingParser::EntryAvailable() const {
148 return !entries_.empty(); 289 return !entries_.empty();
149 } 290 }
150 291
151 FtpDirectoryListingEntry FtpLsDirectoryListingParser::PopEntry() { 292 FtpDirectoryListingEntry FtpLsDirectoryListingParser::PopEntry() {
152 FtpDirectoryListingEntry entry = entries_.front(); 293 FtpDirectoryListingEntry entry = entries_.front();
153 entries_.pop(); 294 entries_.pop();
154 return entry; 295 return entry;
155 } 296 }
156 297
298 FtpVmsDirectoryListingParser::FtpVmsDirectoryListingParser()
299 : state_(STATE_INITIAL),
300 last_is_directory_(false) {
301 }
302
303 bool FtpVmsDirectoryListingParser::ConsumeLine(const string16& line) {
304 switch (state_) {
305 case STATE_INITIAL:
306 DCHECK(last_filename_.empty());
307 if (line.empty())
308 return true;
309 if (StartsWith(line, ASCIIToUTF16("Total of "), true)) {
310 state_ = STATE_END;
311 return true;
312 }
313 // We assume that the first non-empty line is the listing header. It often
314 // starts with "Directory ", but not always.
315 state_ = STATE_RECEIVED_HEADER;
316 return true;
317 case STATE_RECEIVED_HEADER:
318 DCHECK(last_filename_.empty());
319 if (line.empty())
320 return true;
321 state_ = STATE_ENTRIES;
322 return ConsumeEntryLine(line);
323 case STATE_ENTRIES:
324 if (line.empty()) {
325 if (!last_filename_.empty())
326 return false;
327 state_ = STATE_RECEIVED_LAST_ENTRY;
328 return true;
329 }
330 return ConsumeEntryLine(line);
331 case STATE_RECEIVED_LAST_ENTRY:
332 DCHECK(last_filename_.empty());
333 if (line.empty())
334 return true;
335 if (!StartsWith(line, ASCIIToUTF16("Total of "), true))
336 return false;
337 state_ = STATE_END;
338 return true;
339 case STATE_END:
340 DCHECK(last_filename_.empty());
341 return false;
342 default:
343 NOTREACHED();
344 return false;
345 }
346 }
347
348 bool FtpVmsDirectoryListingParser::EntryAvailable() const {
349 return !entries_.empty();
350 }
351
352 FtpDirectoryListingEntry FtpVmsDirectoryListingParser::PopEntry() {
353 FtpDirectoryListingEntry entry = entries_.front();
354 entries_.pop();
355 return entry;
356 }
357
358 bool FtpVmsDirectoryListingParser::ConsumeEntryLine(const string16& line) {
359 std::vector<string16> columns;
360 SplitString(CollapseWhitespace(line, false), ' ', &columns);
361
362 if (columns.size() == 1) {
363 if (!last_filename_.empty())
364 return false;
365 return ParseVmsFilename(columns[0], &last_filename_, &last_is_directory_);
366 }
367
368 // Recognize listing entries which generate "access denied" message even when
369 // trying to list them. We don't display them in the final listing.
370 static const char* kAccessDeniedMessages[] = {
371 "%RMS-E-PRV",
372 "privilege",
373 };
374 for (size_t i = 0; i < arraysize(kAccessDeniedMessages); i++) {
375 if (line.find(ASCIIToUTF16(kAccessDeniedMessages[i])) != string16::npos) {
376 last_filename_.clear();
377 last_is_directory_ = false;
378 return true;
379 }
380 }
381
382 string16 filename;
383 bool is_directory = false;
384 if (last_filename_.empty()) {
385 if (!ParseVmsFilename(columns[0], &filename, &is_directory))
386 return false;
387 columns.erase(columns.begin());
388 } else {
389 filename = last_filename_;
390 is_directory = last_is_directory_;
391 last_filename_.clear();
392 last_is_directory_ = false;
393 }
394
395 if (columns.size() > 5)
396 return false;
397
398 if (columns.size() == 5) {
399 if (!LooksLikeVmsFileProtectionListing(columns[4]))
400 return false;
401 if (!LooksLikeVmsUserIdentificationCode(columns[3]))
402 return false;
403 columns.resize(3);
404 }
405
406 if (columns.size() != 3)
407 return false;
408
409 FtpDirectoryListingEntry entry;
410 entry.name = filename;
411 entry.type = is_directory ? FtpDirectoryListingEntry::DIRECTORY
412 : FtpDirectoryListingEntry::FILE;
413 if (!ParseVmsFilesize(columns[0], &entry.size))
414 return false;
415 if (entry.size < 0)
416 return false;
417 if (entry.type != FtpDirectoryListingEntry::FILE)
418 entry.size = -1;
419 if (!VmsDateListingToTime(columns, &entry.last_modified))
420 return false;
421
422 entries_.push(entry);
423 return true;
424 }
425
157 } // namespace net 426 } // namespace net
OLDNEW
« no previous file with comments | « net/ftp/ftp_directory_listing_parsers.h ('k') | net/ftp/ftp_directory_listing_parsers_unittest.cc » ('j') | no next file with comments »

Powered by Google App Engine