net/ftp/ftp_util.cc - platform/external/chromium - Git at Google

 // Copyright (c) 2011 The Chromium Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 #include "net/ftp/ftp_util.h"

 #include <vector>

 #include "base/i18n/char_iterator.h"
 #include "base/logging.h"
 #include "base/string_number_conversions.h"
 #include "base/string_tokenizer.h"
 #include "base/string_util.h"
 #include "base/time.h"
 #include "base/utf_string_conversions.h"
 #include "unicode/datefmt.h"
 #include "unicode/dtfmtsym.h"
 #include "unicode/uchar.h"

 // For examples of Unix<->VMS path conversions, see the unit test file. On VMS
 // a path looks differently depending on whether it's a file or directory.

 namespace net {

 // static
 std::string FtpUtil::UnixFilePathToVMS(const std::string& unix_path) {
   if (unix_path.empty())
     return std::string();

   StringTokenizer tokenizer(unix_path, "/");
   std::vector<std::string> tokens;
   while (tokenizer.GetNext())
     tokens.push_back(tokenizer.token());

   if (unix_path[0] == '/') {
     // It's an absolute path.

     if (tokens.empty()) {
       DCHECK_EQ(1U, unix_path.length());
       return "[]";
     }

     if (tokens.size() == 1)
       return unix_path.substr(1);  // Drop the leading slash.

     std::string result(tokens[0] + ":[");
     if (tokens.size() == 2) {
       // Don't ask why, it just works that way on VMS.
       result.append("000000");
     } else {
       result.append(tokens[1]);
       for (size_t i = 2; i < tokens.size() - 1; i++)
         result.append("." + tokens[i]);
     }
     result.append("]" + tokens[tokens.size() - 1]);
     return result;
   }

   if (tokens.size() == 1)
     return unix_path;

   std::string result("[");
   for (size_t i = 0; i < tokens.size() - 1; i++)
     result.append("." + tokens[i]);
   result.append("]" + tokens[tokens.size() - 1]);
   return result;
 }

 // static
 std::string FtpUtil::UnixDirectoryPathToVMS(const std::string& unix_path) {
   if (unix_path.empty())
     return std::string();

   std::string path(unix_path);

   if (path[path.length() - 1] != '/')
     path.append("/");

   // Reuse logic from UnixFilePathToVMS by appending a fake file name to the
   // real path and removing it after conversion.
   path.append("x");
   path = UnixFilePathToVMS(path);
   return path.substr(0, path.length() - 1);
 }

 // static
 std::string FtpUtil::VMSPathToUnix(const std::string& vms_path) {
   if (vms_path.empty())
     return ".";

   if (vms_path == "[]")
     return "/";

   std::string result(vms_path);
   if (vms_path[0] == '[') {
     // It's a relative path.
     ReplaceFirstSubstringAfterOffset(&result, 0, "[.", "");
   } else {
     // It's an absolute path.
     result.insert(0, "/");
     ReplaceSubstringsAfterOffset(&result, 0, ":[000000]", "/");
     ReplaceSubstringsAfterOffset(&result, 0, ":[", "/");
   }
   std::replace(result.begin(), result.end(), '.', '/');
   std::replace(result.begin(), result.end(), ']', '/');

   // Make sure the result doesn't end with a slash.
   if (result.length() && result[result.length() - 1] == '/')
     result = result.substr(0, result.length() - 1);

   return result;
 }

 // static
 bool FtpUtil::AbbreviatedMonthToNumber(const string16& text, int* number) {
   icu::UnicodeString unicode_text(text.data(), text.size());

   int32_t locales_count;
   const icu::Locale* locales =
       icu::DateFormat::getAvailableLocales(locales_count);

   // Some FTP servers localize the date listings. To guess the locale,
   // we loop over all available ones.
   for (int32_t locale = 0; locale < locales_count; locale++) {
     UErrorCode status(U_ZERO_ERROR);

     icu::DateFormatSymbols format_symbols(locales[locale], status);

     // If we cannot get format symbols for some locale, it's not a fatal error.
     // Just try another one.
     if (U_FAILURE(status))
       continue;

     int32_t months_count;
     const icu::UnicodeString* months =
         format_symbols.getShortMonths(months_count);

     // Loop over all abbreviated month names in given locale.
     // An alternative solution (to parse |text| in given locale) is more
     // lenient, and may accept more than we want even with setLenient(false).
     for (int32_t month = 0; month < months_count; month++) {
       // Compare (case-insensitive), but just first three characters. Sometimes
       // ICU returns longer strings (for example for Russian locale), and in FTP
       // listings they are abbreviated to just three characters.
       // Note: ICU may also return strings shorter than three characters,
       // and those also should be accepted.
       if (months[month].caseCompare(0, 3, unicode_text, 0) == 0) {
         *number = month + 1;
         return true;
       }
     }
   }

   return false;
 }

 // static
 bool FtpUtil::LsDateListingToTime(const string16& month, const string16& day,
                                   const string16& rest,
                                   const base::Time& current_time,
                                   base::Time* result) {
   base::Time::Exploded time_exploded = { 0 };

   if (!AbbreviatedMonthToNumber(month, &time_exploded.month))
     return false;

   if (!base::StringToInt(day, &time_exploded.day_of_month))
     return false;
   if (time_exploded.day_of_month > 31)
     return false;

   if (!base::StringToInt(rest, &time_exploded.year)) {
     // Maybe it's time. Does it look like time (HH:MM)?
     if (rest.length() == 5 && rest[2] == ':') {
       if (!base::StringToInt(rest.begin(),
                              rest.begin() + 2,
                              &time_exploded.hour))
         return false;

       if (!base::StringToInt(rest.begin() + 3,
                              rest.begin() + 5,
                              &time_exploded.minute))
         return false;
     } else if (rest.length() == 4 && rest[1] == ':') {
       // Sometimes it's just H:MM.
       if (!base::StringToInt(rest.begin(),
                              rest.begin() + 1,
                              &time_exploded.hour))
         return false;

       if (!base::StringToInt(rest.begin() + 2,
                              rest.begin() + 4,
                              &time_exploded.minute))
         return false;
     } else {
       return false;
     }

     // Guess the year.
     base::Time::Exploded current_exploded;
     current_time.LocalExplode(&current_exploded);

     // If it's not possible for the parsed date to be in the current year,
     // use the previous year.
     if (time_exploded.month > current_exploded.month ||
         (time_exploded.month == current_exploded.month &&
          time_exploded.day_of_month > current_exploded.day_of_month)) {
       time_exploded.year = current_exploded.year - 1;
     } else {
       time_exploded.year = current_exploded.year;
     }
   }

   // We don't know the time zone of the listing, so just use local time.
   *result = base::Time::FromLocalExploded(time_exploded);
   return true;
 }

 // static
 string16 FtpUtil::GetStringPartAfterColumns(const string16& text, int columns) {
   base::i18n::UTF16CharIterator iter(&text);

   // TODO(jshin): Is u_isspace the right function to use here?
   for (int i = 0; i < columns; i++) {
     // Skip the leading whitespace.
     while (!iter.end() && u_isspace(iter.get()))
       iter.Advance();

     // Skip the actual text of i-th column.
     while (!iter.end() && !u_isspace(iter.get()))
       iter.Advance();
   }

   string16 result(text.substr(iter.array_pos()));
   TrimWhitespace(result, TRIM_ALL, &result);
   return result;
 }

 }  // namespace
	// Copyright (c) 2011 The Chromium Authors. All rights reserved.
	// Use of this source code is governed by a BSD-style license that can be
	// found in the LICENSE file.

	#include "net/ftp/ftp_util.h"

	#include <vector>

	#include "base/i18n/char_iterator.h"
	#include "base/logging.h"
	#include "base/string_number_conversions.h"
	#include "base/string_tokenizer.h"
	#include "base/string_util.h"
	#include "base/time.h"
	#include "base/utf_string_conversions.h"
	#include "unicode/datefmt.h"
	#include "unicode/dtfmtsym.h"
	#include "unicode/uchar.h"

	// For examples of Unix<->VMS path conversions, see the unit test file. On VMS
	// a path looks differently depending on whether it's a file or directory.

	namespace net {

	// static
	std::string FtpUtil::UnixFilePathToVMS(const std::string& unix_path) {
	if (unix_path.empty())
	return std::string();

	StringTokenizer tokenizer(unix_path, "/");
	std::vector<std::string> tokens;
	while (tokenizer.GetNext())
	tokens.push_back(tokenizer.token());

	if (unix_path[0] == '/') {
	// It's an absolute path.

	if (tokens.empty()) {
	DCHECK_EQ(1U, unix_path.length());
	return "[]";
	}

	if (tokens.size() == 1)
	return unix_path.substr(1); // Drop the leading slash.

	std::string result(tokens[0] + ":[");
	if (tokens.size() == 2) {
	// Don't ask why, it just works that way on VMS.
	result.append("000000");
	} else {
	result.append(tokens[1]);
	for (size_t i = 2; i < tokens.size() - 1; i++)
	result.append("." + tokens[i]);
	}
	result.append("]" + tokens[tokens.size() - 1]);
	return result;
	}

	if (tokens.size() == 1)
	return unix_path;

	std::string result("[");
	for (size_t i = 0; i < tokens.size() - 1; i++)
	result.append("." + tokens[i]);
	result.append("]" + tokens[tokens.size() - 1]);
	return result;
	}

	// static
	std::string FtpUtil::UnixDirectoryPathToVMS(const std::string& unix_path) {
	if (unix_path.empty())
	return std::string();

	std::string path(unix_path);

	if (path[path.length() - 1] != '/')
	path.append("/");

	// Reuse logic from UnixFilePathToVMS by appending a fake file name to the
	// real path and removing it after conversion.
	path.append("x");
	path = UnixFilePathToVMS(path);
	return path.substr(0, path.length() - 1);
	}

	// static
	std::string FtpUtil::VMSPathToUnix(const std::string& vms_path) {
	if (vms_path.empty())
	return ".";

	if (vms_path == "[]")
	return "/";

	std::string result(vms_path);
	if (vms_path[0] == '[') {
	// It's a relative path.
	ReplaceFirstSubstringAfterOffset(&result, 0, "[.", "");
	} else {
	// It's an absolute path.
	result.insert(0, "/");
	ReplaceSubstringsAfterOffset(&result, 0, ":[000000]", "/");
	ReplaceSubstringsAfterOffset(&result, 0, ":[", "/");
	}
	std::replace(result.begin(), result.end(), '.', '/');
	std::replace(result.begin(), result.end(), ']', '/');

	// Make sure the result doesn't end with a slash.
	if (result.length() && result[result.length() - 1] == '/')
	result = result.substr(0, result.length() - 1);

	return result;
	}

	// static
	bool FtpUtil::AbbreviatedMonthToNumber(const string16& text, int* number) {
	icu::UnicodeString unicode_text(text.data(), text.size());

	int32_t locales_count;
	const icu::Locale* locales =
	icu::DateFormat::getAvailableLocales(locales_count);

	// Some FTP servers localize the date listings. To guess the locale,
	// we loop over all available ones.
	for (int32_t locale = 0; locale < locales_count; locale++) {
	UErrorCode status(U_ZERO_ERROR);

	icu::DateFormatSymbols format_symbols(locales[locale], status);

	// If we cannot get format symbols for some locale, it's not a fatal error.
	// Just try another one.
	if (U_FAILURE(status))
	continue;

	int32_t months_count;
	const icu::UnicodeString* months =
	format_symbols.getShortMonths(months_count);

	// Loop over all abbreviated month names in given locale.
	// An alternative solution (to parse \|text\| in given locale) is more
	// lenient, and may accept more than we want even with setLenient(false).
	for (int32_t month = 0; month < months_count; month++) {
	// Compare (case-insensitive), but just first three characters. Sometimes
	// ICU returns longer strings (for example for Russian locale), and in FTP
	// listings they are abbreviated to just three characters.
	// Note: ICU may also return strings shorter than three characters,
	// and those also should be accepted.
	if (months[month].caseCompare(0, 3, unicode_text, 0) == 0) {
	*number = month + 1;
	return true;
	}
	}
	}

	return false;
	}

	// static
	bool FtpUtil::LsDateListingToTime(const string16& month, const string16& day,
	const string16& rest,
	const base::Time& current_time,
	base::Time* result) {
	base::Time::Exploded time_exploded = { 0 };

	if (!AbbreviatedMonthToNumber(month, &time_exploded.month))
	return false;

	if (!base::StringToInt(day, &time_exploded.day_of_month))
	return false;
	if (time_exploded.day_of_month > 31)
	return false;

	if (!base::StringToInt(rest, &time_exploded.year)) {
	// Maybe it's time. Does it look like time (HH:MM)?
	if (rest.length() == 5 && rest[2] == ':') {
	if (!base::StringToInt(rest.begin(),
	rest.begin() + 2,
	&time_exploded.hour))
	return false;

	if (!base::StringToInt(rest.begin() + 3,
	rest.begin() + 5,
	&time_exploded.minute))
	return false;
	} else if (rest.length() == 4 && rest[1] == ':') {
	// Sometimes it's just H:MM.
	if (!base::StringToInt(rest.begin(),
	rest.begin() + 1,
	&time_exploded.hour))
	return false;

	if (!base::StringToInt(rest.begin() + 2,
	rest.begin() + 4,
	&time_exploded.minute))
	return false;
	} else {
	return false;
	}

	// Guess the year.
	base::Time::Exploded current_exploded;
	current_time.LocalExplode(&current_exploded);

	// If it's not possible for the parsed date to be in the current year,
	// use the previous year.
	if (time_exploded.month > current_exploded.month \|\|
	(time_exploded.month == current_exploded.month &&
	time_exploded.day_of_month > current_exploded.day_of_month)) {
	time_exploded.year = current_exploded.year - 1;
	} else {
	time_exploded.year = current_exploded.year;
	}
	}

	// We don't know the time zone of the listing, so just use local time.
	*result = base::Time::FromLocalExploded(time_exploded);
	return true;
	}

	// static
	string16 FtpUtil::GetStringPartAfterColumns(const string16& text, int columns) {
	base::i18n::UTF16CharIterator iter(&text);

	// TODO(jshin): Is u_isspace the right function to use here?
	for (int i = 0; i < columns; i++) {
	// Skip the leading whitespace.
	while (!iter.end() && u_isspace(iter.get()))
	iter.Advance();

	// Skip the actual text of i-th column.
	while (!iter.end() && !u_isspace(iter.get()))
	iter.Advance();
	}

	string16 result(text.substr(iter.array_pos()));
	TrimWhitespace(result, TRIM_ALL, &result);
	return result;
	}

	} // namespace