#include "chrome/utility/importer/ie_importer_win.h"
#include <objbase.h>
#include <ole2.h>
#include <intshcut.h>
#include <shlobj.h>
#include <stddef.h>
#include <urlhist.h>
#include <wininet.h>
#include <wrl/client.h>
#include <algorithm>
#include <map>
#include <string>
#include <vector>
#include "base/compiler_specific.h"
#include "base/containers/contains.h"
#include "base/files/file_enumerator.h"
#include "base/files/file_path.h"
#include "base/files/file_util.h"
#include "base/logging.h"
#include "base/memory/raw_ptr.h"
#include "base/strings/string_split.h"
#include "base/strings/string_util.h"
#include "base/strings/utf_string_conversions.h"
#include "base/time/time.h"
#include "base/win/registry.h"
#include "base/win/scoped_co_mem.h"
#include "base/win/scoped_handle.h"
#include "base/win/scoped_propvariant.h"
#include "chrome/common/importer/edge_importer_utils_win.h"
#include "chrome/common/importer/ie_importer_utils_win.h"
#include "chrome/common/importer/importer_bridge.h"
#include "chrome/common/importer/pstore_declarations.h"
#include "chrome/grit/generated_resources.h"
#include "components/user_data_importer/common/imported_bookmark_entry.h"
#include "components/user_data_importer/common/importer_data_types.h"
#include "components/user_data_importer/common/importer_url_row.h"
#include "components/user_data_importer/content/favicon_reencode.h"
#include "ui/base/l10n/l10n_util.h"
#include "url/gurl.h"
#include "url/url_constants.h"
namespace {
// Registry path whose subkeys IEImporter::ImportSearchEngines() enumerates
// under HKEY_CURRENT_USER; each subkey is read for a "URL" value and a name.
const wchar_t kSearchScopePath[] =
L"Software\\Microsoft\\Internet Explorer\\SearchScopes";
// Suffix appended to a shortcut file's path by
// ReadFaviconDataFromInternetShortcut() to read the favicon bytes stored with
// that shortcut (the ":name:$DATA" form addresses a named stream of the file).
const wchar_t kFaviconStreamName[] = L":favicon:$DATA";
// Returns the creation timestamp of |file|. A default-constructed base::Time
// is returned when the file cannot be opened or its times cannot be queried.
base::Time GetFileCreationTime(const base::FilePath& file) {
  const DWORD share_mode =
      FILE_SHARE_READ | FILE_SHARE_WRITE | FILE_SHARE_DELETE;
  const DWORD open_flags = FILE_ATTRIBUTE_NORMAL | FILE_FLAG_BACKUP_SEMANTICS;

  // The handle is closed automatically when |handle| goes out of scope.
  base::win::ScopedHandle handle(
      CreateFile(file.value().c_str(), GENERIC_READ, share_mode, nullptr,
                 OPEN_EXISTING, open_flags, nullptr));
  if (!handle.is_valid()) {
    return base::Time();
  }

  FILETIME created;
  if (!GetFileTime(handle.Get(), &created, nullptr, nullptr)) {
    return base::Time();
  }
  return base::Time::FromFileTime(created);
}
// Copies sizeof(T) bytes starting at byte |offset| of |blob| into |*data|.
// Returns true on success. Returns false, leaving |*data| untouched, when the
// requested byte range does not lie entirely inside |blob|.
template <typename T>
bool BinaryRead(T* data, size_t offset, const std::vector<uint8_t>& blob) {
  // Compare against the number of bytes remaining after |offset| rather than
  // computing |offset + sizeof(T)|: that sum can wrap around for a very large
  // |offset| and make an out-of-range read look valid.
  if (offset > blob.size() || sizeof(T) > blob.size() - offset) {
    return false;
  }
  UNSAFE_TODO(memcpy(data, &blob[offset], sizeof(T)));
  return true;
}
// Validates the item ID list stored in |blob| at byte |offset| and returns a
// pointer to it (pointing into |blob|'s storage), or nullptr if it is not
// well-formed.
//
// The list is walked entry by entry: each entry starts with a USHORT byte
// count, and an entry whose count is zero terminates the list. The list is
// rejected unless the terminator is found within the first |idlist_size|
// bytes and every count that is read lies inside |blob|.
LPCITEMIDLIST BinaryReadItemIDList(size_t offset,
                                   size_t idlist_size,
                                   const std::vector<uint8_t>& blob) {
  size_t head = 0;
  while (true) {
    USHORT id_cb;
    // The complete count field (not only its first byte) has to fit inside
    // the declared list size; otherwise part of it would belong to whatever
    // follows the list. Written as a subtraction so it cannot wrap around.
    if (idlist_size < sizeof(id_cb) || head > idlist_size - sizeof(id_cb) ||
        !BinaryRead(&id_cb, offset + head, blob)) {
      return nullptr;
    }
    if (id_cb == 0) {
      break;
    }
    head += id_cb;
  }
  // At least one BinaryRead() at |offset| succeeded, so |offset| is in range.
  return reinterpret_cast<LPCITEMIDLIST>(&blob[offset]);
}
// Strict-less-than functor used to sort imported bookmarks according to the
// per-path sort indices held in |sort_index_|.
//
// Each bookmark is viewed as a sequence of path components: the folder names
// in |path| followed by "<title>.url". The two sequences are compared level by
// level; at the first level where the names differ, the entry whose
// accumulated path has the smaller sort index comes first. Paths missing from
// |sort_index_| are given the index kNotSorted. Equal indices fall back to
// comparing the two names.
struct IEOrderBookmarkComparator {
  bool operator()(const user_data_importer::ImportedBookmarkEntry& lhs,
                  const user_data_importer::ImportedBookmarkEntry& rhs) const {
    static const uint32_t kNotSorted = 0xfffffffb;

    // Name of |entry|'s component at |depth|: a folder name while still inside
    // |entry.path|, and the shortcut file name once past the last folder.
    const auto component_at =
        [](const user_data_importer::ImportedBookmarkEntry& entry,
           size_t depth) -> base::FilePath::StringType {
      if (depth < entry.path.size()) {
        return base::AsWString(entry.path[depth]);
      }
      return base::AsWString(entry.title) + L".url";
    };

    // Sort index recorded for |key|, or kNotSorted when none is recorded.
    const auto rank_of = [this](const base::FilePath& key) -> uint32_t {
      const auto found = sort_index_->find(key);
      return found == sort_index_->end() ? kNotSorted : found->second;
    };

    const size_t left_depth = lhs.path.size();
    const size_t right_depth = rhs.path.size();
    base::FilePath left_prefix;
    base::FilePath right_prefix;
    for (size_t level = 0; level <= left_depth && level <= right_depth;
         ++level) {
      const base::FilePath::StringType left_name = component_at(lhs, level);
      const base::FilePath::StringType right_name = component_at(rhs, level);
      left_prefix = left_prefix.Append(left_name);
      right_prefix = right_prefix.Append(right_name);
      if (left_name != right_name) {
        // First differing level decides the order.
        const uint32_t left_rank = rank_of(left_prefix);
        const uint32_t right_rank = rank_of(right_prefix);
        return left_rank != right_rank ? left_rank < right_rank
                                       : left_name < right_name;
      }
    }
    // Every compared component matched: the shallower entry sorts first.
    return left_depth < right_depth;
  }

  // Maps a path (relative to the favorites root) to its sort index. Not owned.
  raw_ptr<const std::map<base::FilePath, uint32_t>> sort_index_;
};
// Parses one favorites-order |blob| and records a sort index for every item
// it describes into |sort_index|, keyed by |path| joined with the item's file
// name.
//
// Layout as read by this function: a uint32 item count at byte 16, followed
// from byte 20 by that many records. Each record holds its own total size
// (uint32 at +0), the item's sort index (uint32 at +4) and an item ID list
// (from +8 up to the end of the record).
//
// Returns false if the blob is truncated or malformed, or if an item's ID
// list cannot be converted to a file system path. Parsing stops early, and
// still returns true, once |importer| reports cancellation.
[[nodiscard]] bool ParseFavoritesOrderBlob(
    const Importer* importer,
    const std::vector<uint8_t>& blob,
    const base::FilePath& path,
    std::map<base::FilePath, uint32_t>* sort_index) {
  static const size_t kItemCountOffset = 16;
  static const size_t kItemListStartOffset = 20;

  uint32_t item_count = 0;
  if (!BinaryRead(&item_count, kItemCountOffset, blob)) {
    return false;
  }

  // Invariant: |base_offset| <= blob.size(). The successful read above proves
  // the blob has at least 20 bytes, and the offset only advances by record
  // sizes that were verified to stay inside the blob.
  size_t base_offset = kItemListStartOffset;
  for (uint32_t i = 0; i < item_count && !importer->cancelled(); ++i) {
    static const size_t kSizeOffset = 0;
    static const size_t kSortIndexOffset = 4;
    static const uint32_t kItemIDListOffset = 8;

    uint32_t item_size = 0;
    if (!BinaryRead(&item_size, base_offset + kSizeOffset, blob)) {
      return false;
    }
    // A record must be large enough to hold its fixed header; otherwise
    // |item_size - kItemIDListOffset| below would wrap around to a huge value
    // and the ID list walk could run into the records that follow. This also
    // rejects zero-sized records, which would never advance |base_offset|.
    // The subtraction form of the upper bound cannot overflow (see invariant).
    if (item_size < kItemIDListOffset ||
        item_size > blob.size() - base_offset) {
      return false;
    }

    uint32_t item_sort_index = 0;
    if (!BinaryRead(&item_sort_index, base_offset + kSortIndexOffset, blob)) {
      return false;
    }

    LPCITEMIDLIST idlist = BinaryReadItemIDList(
        base_offset + kItemIDListOffset, item_size - kItemIDListOffset, blob);
    TCHAR item_filename[MAX_PATH];
    if (!idlist || !SHGetPathFromIDList(idlist, item_filename)) {
      return false;
    }

    // Only the file name of the resolved path is kept; it is re-rooted at
    // |path|. An already-recorded path keeps its first index.
    base::FilePath item_relative_path =
        path.Append(base::FilePath(item_filename).BaseName());
    sort_index->emplace(item_relative_path, item_sort_index);
    base_offset += item_size;
  }
  return true;
}
// Reads the "Order" value of |key| (if present and non-empty), parses it with
// ParseFavoritesOrderBlob() for the folder |path|, and then recurses into
// every readable subkey of |key| with the subkey name appended to |path|.
//
// Returns false as soon as any blob fails to parse. A missing, empty or
// unreadable "Order" value is not an error. Subkey enumeration stops early
// once |importer| reports cancellation.
[[nodiscard]] bool ParseFavoritesOrderRegistryTree(
    const Importer* importer,
    const base::win::RegKey& key,
    const base::FilePath& path,
    std::map<base::FilePath, uint32_t>* sort_index) {
  // First call only asks for the size of the value.
  DWORD blob_length = 0;
  if (key.ReadValue(L"Order", nullptr, &blob_length, nullptr) ==
          ERROR_SUCCESS &&
      blob_length > 0) {
    std::vector<uint8_t> blob(blob_length);
    if (key.ReadValue(L"Order", blob.data(), &blob_length, nullptr) ==
        ERROR_SUCCESS) {
      // The value may have shrunk between the two reads; trim the buffer to
      // the number of bytes actually returned so that stale zero padding is
      // not parsed as if it were part of the value.
      blob.resize(blob_length);
      if (!ParseFavoritesOrderBlob(importer, blob, path, sort_index)) {
        return false;
      }
    }
  }

  for (base::win::RegistryKeyIterator child(key.Handle(), L"");
       child.Valid() && !importer->cancelled(); ++child) {
    base::win::RegKey subkey(key.Handle(), child.Name(), KEY_READ);
    if (!subkey.Valid()) {
      continue;
    }
    const base::FilePath subpath(path.Append(child.Name()));
    if (!ParseFavoritesOrderRegistryTree(importer, subkey, subpath,
                                         sort_index)) {
      return false;
    }
  }
  return true;
}
[[nodiscard]] bool ParseFavoritesOrderInfo(
const Importer* importer,
std::map<base::FilePath, uint32_t>* sort_index);
bool ParseFavoritesOrderInfo(const Importer* importer,
std::map<base::FilePath, uint32_t>* sort_index) {
std::wstring key_path(importer::GetIEFavoritesOrderKey());
base::win::RegKey key(HKEY_CURRENT_USER, key_path.c_str(), KEY_READ);
if (!key.Valid())
return false;
return ParseFavoritesOrderRegistryTree(importer, key, base::FilePath(),
sort_index);
}
// Reorders |bookmarks| using the sort indices obtained from
// ParseFavoritesOrderInfo(). If that information cannot be obtained,
// |bookmarks| is left in its current order.
void SortBookmarksInIEOrder(
    const Importer* importer,
    std::vector<user_data_importer::ImportedBookmarkEntry>* bookmarks) {
  std::map<base::FilePath, uint32_t> order_by_path;
  const bool have_order = ParseFavoritesOrderInfo(importer, &order_by_path);
  if (have_order) {
    // The comparator only borrows |order_by_path|, which outlives the sort.
    std::sort(bookmarks->begin(), bookmarks->end(),
              IEOrderBookmarkComparator{&order_by_path});
  }
}
// Creates an InternetShortcut COM object and loads the shortcut stored in
// |file| into it. On success the object is handed over through |shortcut| and
// true is returned; on any failure |shortcut| is left unchanged and false is
// returned.
bool LoadInternetShortcut(
    const base::FilePath& file,
    Microsoft::WRL::ComPtr<IUniformResourceLocator>* shortcut) {
  Microsoft::WRL::ComPtr<IUniformResourceLocator> locator;
  HRESULT hr =
      ::CoCreateInstance(CLSID_InternetShortcut, nullptr, CLSCTX_INPROC_SERVER,
                         IID_PPV_ARGS(&locator));
  if (FAILED(hr)) {
    return false;
  }

  // Loading from disk goes through the object's IPersistFile interface.
  Microsoft::WRL::ComPtr<IPersistFile> persist;
  hr = locator.As(&persist);
  if (FAILED(hr)) {
    return false;
  }

  hr = persist->Load(file.value().c_str(), STGM_READ);
  if (FAILED(hr)) {
    return false;
  }

  std::swap(*shortcut, locator);
  return true;
}
// Returns the URL stored in |url_locator|, or an empty GURL if the URL cannot
// be retrieved or the shortcut yields a null string.
GURL ReadURLFromInternetShortcut(IUniformResourceLocator* url_locator) {
  // ScopedCoMem releases the string returned by GetURL() on scope exit.
  base::win::ScopedCoMem<wchar_t> url;
  const HRESULT hr = url_locator->GetURL(&url);
  if (FAILED(hr) || !url) {
    return GURL();
  }
  return GURL(base::as_u16cstr(url));
}
// Returns the URL held in the PID_IS_ICONFILE property of the shortcut's
// FMTID_Intshcut property set. An empty GURL is returned if the property set
// cannot be opened, the property cannot be read, or it is not a wide string.
GURL ReadFaviconURLFromInternetShortcut(IUniformResourceLocator* url_locator) {
  Microsoft::WRL::ComPtr<IPropertySetStorage> set_storage;
  HRESULT hr = url_locator->QueryInterface(IID_PPV_ARGS(&set_storage));
  if (FAILED(hr)) {
    return GURL();
  }

  Microsoft::WRL::ComPtr<IPropertyStorage> storage;
  hr = set_storage->Open(FMTID_Intshcut, STGM_READ, &storage);
  if (FAILED(hr)) {
    return GURL();
  }

  PROPSPEC icon_file_spec[] = {{PRSPEC_PROPID, {PID_IS_ICONFILE}}};
  base::win::ScopedPropVariant value;
  hr = storage->ReadMultiple(1, icon_file_spec, value.Receive());
  if (FAILED(hr) || value.get().vt != VT_LPWSTR) {
    return GURL();
  }
  return GURL(base::as_u16cstr(value.get().pwszVal));
}
// Reads the bytes found at |file|'s path with kFaviconStreamName appended.
// Returns std::nullopt if that read fails.
std::optional<std::vector<uint8_t>> ReadFaviconDataFromInternetShortcut(
    const base::FilePath& file) {
  base::FilePath::StringType stream_path = file.value();
  stream_path += kFaviconStreamName;
  return base::ReadFileToBytes(base::FilePath(stream_path));
}
// Looks up |favicon_url| in the WinINet URL cache and returns the contents of
// the local file backing the cache entry. Returns std::nullopt if there is no
// usable entry or the file cannot be read.
std::optional<std::vector<uint8_t>> ReadFaviconDataFromCache(
    const GURL& favicon_url) {
  const std::wstring url_wstring(base::UTF8ToWide(favicon_url.spec()));

  // Probe with no buffer to learn how many bytes the entry info needs. The
  // only outcome we can proceed from is a failure with
  // ERROR_INSUFFICIENT_BUFFER and a non-zero size. GetLastError() is
  // meaningful only after a failed call, so an unexpected success is treated
  // as "nothing to read" instead of inspecting a stale error code.
  DWORD info_size = 0;
  if (GetUrlCacheEntryInfoEx(url_wstring.c_str(), nullptr, &info_size, nullptr,
                             nullptr, nullptr, 0) ||
      GetLastError() != ERROR_INSUFFICIENT_BUFFER || info_size == 0) {
    return std::nullopt;
  }

  // The entry info is variable-sized: the struct is followed by the strings
  // its members point to, hence the raw byte buffer.
  std::vector<char> buf(info_size);
  INTERNET_CACHE_ENTRY_INFO* cache =
      reinterpret_cast<INTERNET_CACHE_ENTRY_INFO*>(buf.data());
  if (!GetUrlCacheEntryInfoEx(url_wstring.c_str(), cache, &info_size, nullptr,
                              nullptr, nullptr, 0)) {
    return std::nullopt;
  }

  // Defensive: never build a path from a null string pointer.
  if (!cache->lpszLocalFileName) {
    return std::nullopt;
  }
  return base::ReadFileToBytes(base::FilePath(cache->lpszLocalFileName));
}
// Obtains the favicon image for a shortcut and returns it re-encoded by
// importer::ReencodeFavicon(). The bytes stored with the shortcut |file| are
// preferred; the URL cache entry for |favicon_url| is the fallback. Returns
// std::nullopt when neither source yields data.
std::optional<std::vector<uint8_t>> ReadReencodedFaviconData(
    const base::FilePath& file,
    const GURL& favicon_url) {
  std::optional<std::vector<uint8_t>> raw_image =
      ReadFaviconDataFromInternetShortcut(file);
  if (!raw_image.has_value()) {
    raw_image = ReadFaviconDataFromCache(favicon_url);
  }
  if (!raw_image.has_value()) {
    return std::nullopt;
  }
  return importer::ReencodeFavicon(*raw_image);
}
// Associates the page |url| with the favicon referenced by its shortcut.
//
// |url_file| is the shortcut file, |url_locator| the loaded shortcut object
// and |favicon_map| a map keyed by favicon URL. If the favicon URL is already
// in the map, |url| is added to that entry's URL set. Otherwise the image is
// loaded and re-encoded, and a new entry is created only if that succeeds.
// Nothing happens when the shortcut has no valid favicon URL.
void UpdateFaviconMap(
    const base::FilePath& url_file,
    const GURL& url,
    IUniformResourceLocator* url_locator,
    std::map<GURL, favicon_base::FaviconUsageData>* favicon_map) {
  const GURL favicon_url = ReadFaviconURLFromInternetShortcut(url_locator);
  if (!favicon_url.is_valid()) {
    return;
  }

  if (auto known = favicon_map->find(favicon_url);
      known != favicon_map->end()) {
    known->second.urls.insert(url);
    return;
  }

  std::optional<std::vector<uint8_t>> png_data =
      ReadReencodedFaviconData(url_file, favicon_url);
  if (!png_data) {
    return;
  }

  // The key is known to be absent, so operator[] creates the entry. Filling it
  // in place avoids building a temporary FaviconUsageData and then copying it,
  // PNG bytes included, into the map.
  favicon_base::FaviconUsageData& usage = (*favicon_map)[favicon_url];
  usage.png_data = std::move(png_data).value();
  usage.favicon_url = favicon_url;
  usage.urls.insert(url);
}
}
// GUID constant exposed as IEImporter::kPStoreAutocompleteGUID. It is not
// referenced elsewhere in this part of the file.
// NOTE(review): judging by the name this identifies IE's protected-storage
// autocomplete data - confirm against the class declaration.
const GUID IEImporter::kPStoreAutocompleteGUID = {
0xe161255a,
0x37c3,
0x11d2,
{0xbc, 0xaa, 0x00, 0xc0, 0x4f, 0xd9, 0x29, 0xdb}};
// GUID constant exposed as IEImporter::kUnittestGUID. It is not referenced
// elsewhere in this part of the file.
// NOTE(review): presumably a stand-in GUID used only by unit tests - confirm
// against the class declaration.
const GUID IEImporter::kUnittestGUID = {
0xa79029d6,
0x753e,
0x4e27,
{0xb8, 0x7, 0x3d, 0x46, 0xab, 0x15, 0x45, 0xdf}};
// Starts with Edge import mode switched off; StartImport() sets the mode from
// the source profile's importer type.
IEImporter::IEImporter() : edge_import_mode_(false) {}
// Runs the import for |source_profile| and reports progress through |bridge|.
//
// |items| is a bitmask of user_data_importer item flags. The requested items
// are processed in a fixed order: home page, history, favorites, search
// engines. Each one is bracketed by NotifyItemStarted()/NotifyItemEnded() and
// is skipped once the import has been cancelled. When the source profile is
// of type TYPE_EDGE only favorites are imported.
void IEImporter::StartImport(
    const user_data_importer::SourceProfile& source_profile,
    uint16_t items,
    ImporterBridge* bridge) {
  bridge_ = bridge;
  source_path_ = source_profile.source_path;
  edge_import_mode_ =
      (source_profile.importer_type == user_data_importer::TYPE_EDGE);
  if (edge_import_mode_) {
    // Callers are expected to ask for favorites only; enforce that as well
    // for builds where the DCHECK is compiled out.
    DCHECK_EQ(items, user_data_importer::FAVORITES);
    items = user_data_importer::FAVORITES;
  }

  // Runs |import_step| for |item| if it was requested and the import has not
  // been cancelled, surrounding it with the per-item notifications.
  const auto run_if_requested = [this, items](
                                    auto item,
                                    void (IEImporter::*import_step)()) {
    if (!(items & item) || cancelled()) {
      return;
    }
    bridge_->NotifyItemStarted(item);
    (this->*import_step)();
    bridge_->NotifyItemEnded(item);
  };

  bridge_->NotifyStarted();
  run_if_requested(user_data_importer::HOME_PAGE, &IEImporter::ImportHomepage);
  run_if_requested(user_data_importer::HISTORY, &IEImporter::ImportHistory);
  run_if_requested(user_data_importer::FAVORITES,
                   &IEImporter::ImportFavorites);
  run_if_requested(user_data_importer::SEARCH_ENGINES,
                   &IEImporter::ImportSearchEngines);
  bridge_->NotifyEnded();
}
// Defaulted: there is no teardown logic beyond destroying the members.
IEImporter::~IEImporter() = default;
// Collects bookmarks and favicons from the favorites folder and forwards the
// non-empty results to the bridge. Bookmarks are added under a folder whose
// localized name depends on whether this is an Edge or an IE import. Nothing
// is forwarded after cancellation, or if the favorites location is unknown.
void IEImporter::ImportFavorites() {
  FavoritesInfo info;
  if (!GetFavoritesInfo(&info)) {
    return;
  }

  BookmarkVector bookmarks;
  favicon_base::FaviconUsageDataList favicons;
  ParseFavoritesFolder(info, &bookmarks, &favicons);

  if (!bookmarks.empty() && !cancelled()) {
    const int folder_name_id = edge_import_mode_
                                   ? IDS_BOOKMARK_GROUP_FROM_EDGE
                                   : IDS_BOOKMARK_GROUP_FROM_IE;
    bridge_->AddBookmarks(bookmarks,
                          l10n_util::GetStringUTF16(folder_name_id));
  }

  if (!favicons.empty() && !cancelled()) {
    bridge_->SetFavicons(favicons);
  }
}
void IEImporter::ImportHistory() {
const std::string kSchemes[] = {url::kHttpScheme, url::kHttpsScheme,
url::kFtpScheme, url::kFileScheme};
Microsoft::WRL::ComPtr<IUrlHistoryStg2> url_history_stg2;
if (FAILED(::CoCreateInstance(CLSID_CUrlHistory, NULL, CLSCTX_INPROC_SERVER,
IID_PPV_ARGS(&url_history_stg2)))) {
return;
}
Microsoft::WRL::ComPtr<IEnumSTATURL> enum_url;
if (SUCCEEDED(url_history_stg2->EnumUrls(&enum_url))) {
std::vector<user_data_importer::ImporterURLRow> rows;
STATURL stat_url;
enum_url->SetFilter(L"", STATURL_QUERYFLAG_TOPLEVEL);
while (!cancelled() && enum_url->Next(1, &stat_url, NULL) == S_OK) {
std::wstring url_string;
if (stat_url.pwcsUrl) {
url_string = stat_url.pwcsUrl;
CoTaskMemFree(stat_url.pwcsUrl);
}
std::wstring title_string;
if (stat_url.pwcsTitle) {
title_string = stat_url.pwcsTitle;
CoTaskMemFree(stat_url.pwcsTitle);
}
GURL url(base::AsStringPiece16(url_string));
if (!url.is_valid() || !base::Contains(kSchemes, url.GetScheme())) {
continue;
}
user_data_importer::ImporterURLRow row(url);
row.title = base::AsString16(title_string);
row.last_visit = base::Time::FromFileTime(stat_url.ftLastVisited);
if (stat_url.dwFlags == STATURLFLAG_ISTOPLEVEL) {
row.visit_count = 1;
row.hidden = false;
} else {
DCHECK(!stat_url.dwFlags);
row.hidden = true;
}
rows.push_back(row);
}
if (!cancelled()) {
bridge_->SetHistoryItems(rows,
user_data_importer::VISIT_SOURCE_IE_IMPORTED);
}
}
}
void IEImporter::ImportSearchEngines() {
typedef std::map<std::string, std::u16string> SearchEnginesMap;
SearchEnginesMap search_engines_map;
for (base::win::RegistryKeyIterator key_iter(HKEY_CURRENT_USER,
kSearchScopePath);
key_iter.Valid(); ++key_iter) {
std::wstring sub_key_name = kSearchScopePath;
sub_key_name.append(L"\\").append(key_iter.Name());
base::win::RegKey sub_key(HKEY_CURRENT_USER, sub_key_name.c_str(),
KEY_READ);
std::wstring wide_url;
if ((sub_key.ReadValue(L"URL", &wide_url) != ERROR_SUCCESS) ||
wide_url.empty()) {
VLOG(1) << "No URL for IE search engine at " << key_iter.Name();
continue;
}
std::wstring name;
if ((sub_key.ReadValue(NULL, &name) != ERROR_SUCCESS) || name.empty()) {
if ((sub_key.ReadValue(L"DisplayName", &name) != ERROR_SUCCESS) ||
name.empty()) {
VLOG(1) << "No name for IE search engine at " << key_iter.Name();
continue;
}
}
std::string url(base::WideToUTF8(wide_url));
SearchEnginesMap::iterator t_iter = search_engines_map.find(url);
if (t_iter == search_engines_map.end()) {
GURL gurl(url);
if (gurl.is_valid())
t_iter = search_engines_map.emplace(url, base::AsString16(name)).first;
}
}
std::vector<user_data_importer::SearchEngineInfo> search_engines;
for (SearchEnginesMap::iterator i = search_engines_map.begin();
i != search_engines_map.end(); ++i) {
user_data_importer::SearchEngineInfo search_engine_info;
search_engine_info.url = base::UTF8ToUTF16(i->first);
search_engine_info.display_name = i->second;
search_engines.push_back(search_engine_info);
}
bridge_->SetKeywords(search_engines, true);
}
void IEImporter::ImportHomepage() {
static constexpr wchar_t kIEHomepage[] = L"Start Page";
static constexpr wchar_t kIEDefaultHomepage[] = L"Default_Page_URL";
std::wstring key_path(importer::GetIESettingsKey());
base::win::RegKey key(HKEY_CURRENT_USER, key_path.c_str(), KEY_READ);
std::wstring homepage_url;
if (key.ReadValue(kIEHomepage, &homepage_url) != ERROR_SUCCESS ||
homepage_url.empty())
return;
GURL homepage = GURL(base::AsStringPiece16(homepage_url));
if (!homepage.is_valid())
return;
base::win::RegKey keyDefault(HKEY_LOCAL_MACHINE, key_path.c_str(), KEY_READ);
std::wstring default_homepage_url;
LONG result = keyDefault.ReadValue(kIEDefaultHomepage, &default_homepage_url);
if (result == ERROR_SUCCESS && !default_homepage_url.empty()) {
if (homepage.spec() == GURL(base::AsString16(default_homepage_url)).spec())
return;
}
bridge_->AddHomePage(homepage);
}
// Fills |info| with the location of the favorites folder and the name of the
// links folder ("Links"). When a source path was supplied to StartImport(),
// the favorites folder is its "Favorites" subdirectory; otherwise the shell's
// CSIDL_FAVORITES folder is used. Returns false, without modifying |info|, if
// the shell folder cannot be resolved.
bool IEImporter::GetFavoritesInfo(IEImporter::FavoritesInfo* info) {
  base::FilePath favorites_dir;
  if (source_path_.empty()) {
    wchar_t shell_path[MAX_PATH];
    if (FAILED(SHGetFolderPath(nullptr, CSIDL_FAVORITES, nullptr,
                               SHGFP_TYPE_CURRENT, shell_path))) {
      return false;
    }
    favorites_dir = base::FilePath(shell_path);
  } else {
    favorites_dir = source_path_.AppendASCII("Favorites");
  }

  info->path = favorites_dir;
  info->links_folder = u"Links";
  return true;
}
void IEImporter::ParseFavoritesFolder(
const FavoritesInfo& info,
BookmarkVector* bookmarks,
favicon_base::FaviconUsageDataList* favicons) {
base::FilePath file;
std::vector<base::FilePath::StringType> file_list;
base::FilePath favorites_path(info.path);
size_t favorites_path_len =
favorites_path.StripTrailingSeparators().value().size();
base::FileEnumerator file_enumerator(favorites_path, true,
base::FileEnumerator::FILES);
while (!(file = file_enumerator.Next()).value().empty() && !cancelled())
file_list.push_back(file.value());
std::sort(file_list.begin(), file_list.end());
typedef std::map<GURL, favicon_base::FaviconUsageData> FaviconMap;
FaviconMap favicon_map;
for (std::vector<base::FilePath::StringType>::iterator it = file_list.begin();
it != file_list.end(); ++it) {
base::FilePath shortcut(*it);
if (!base::EqualsCaseInsensitiveASCII(shortcut.Extension(), ".url"))
continue;
Microsoft::WRL::ComPtr<IUniformResourceLocator> url_locator;
if (!LoadInternetShortcut(shortcut, &url_locator))
continue;
GURL url = ReadURLFromInternetShortcut(url_locator.Get());
if (!url.is_valid())
continue;
if (url.GetHost() == "go.microsoft.com") {
continue;
}
UpdateFaviconMap(shortcut, url, url_locator.Get(), &favicon_map);
base::FilePath::StringType relative_string =
shortcut.DirName().value().substr(favorites_path_len);
if (!relative_string.empty() &&
base::FilePath::IsSeparator(relative_string[0]))
relative_string = relative_string.substr(1);
base::FilePath relative_path(relative_string);
user_data_importer::ImportedBookmarkEntry entry;
entry.title = shortcut.RemoveExtension().BaseName().AsUTF16Unsafe();
entry.url = url;
entry.creation_time = GetFileCreationTime(shortcut);
if (!relative_path.empty()) {
std::vector<std::wstring> wide_components = relative_path.GetComponents();
std::ranges::transform(wide_components, std::back_inserter(entry.path),
&base::AsString16);
}
if (!entry.path.empty() && entry.path[0] == info.links_folder) {
entry.in_toolbar = true;
}
bookmarks->push_back(entry);
}
if (!edge_import_mode_) {
SortBookmarksInIEOrder(this, bookmarks);
}
for (FaviconMap::iterator iter = favicon_map.begin();
iter != favicon_map.end(); ++iter)
favicons->push_back(iter->second);
}