forked from kamyu104/LeetCode-Solutions
-
Notifications
You must be signed in to change notification settings - Fork 15
/
Copy pathweb-crawler.cpp
35 lines (33 loc) · 1.06 KB
/
web-crawler.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
// Time: O(|V| + |E|)
// Space: O(|V|)
/**
* // This is the HtmlParser's API interface.
* // You should not implement it, or speculate about its implementation
* class HtmlParser {
* public:
* vector<string> getUrls(string url);
* };
*/
/**
 * Collects every URL reachable from a start URL whose scheme-and-host prefix
 * matches that of the start URL, following the links reported by HtmlParser.
 */
class Solution {
public:
    /**
     * @param startUrl   URL the crawl begins at; it is always the first
     *                   element of the result.
     * @param htmlParser Parser whose getUrls(url) returns the links found on
     *                   the page at `url`.
     * @return Each discovered same-host URL exactly once, in breadth-first
     *         discovery order.
     */
    vector<string> crawl(string startUrl, HtmlParser htmlParser) {
        // Only URLs whose host prefix equals the start URL's are ever queued,
        // so the prefix to match is fixed and computed once.
        const string host = hostname(startUrl);

        // `result` doubles as the BFS queue: it grows while it is scanned.
        vector<string> result = {startUrl};
        unordered_set<string> lookup(result.cbegin(), result.cend());
        for (size_t i = 0; i < result.size(); ++i) {
            // result[i] is consumed by the call itself; no reference into
            // `result` is kept across emplace_back, which may reallocate.
            for (const auto& to_url : htmlParser.getUrls(result[i])) {
                if (!lookup.count(to_url) && host == hostname(to_url)) {
                    result.emplace_back(to_url);
                    lookup.emplace(to_url);
                }
            }
        }
        return result;
    }

private:
    /**
     * Returns the prefix of `url` up to (not including) the first '/' after
     * the scheme separator, e.g. "http://a.com/x" -> "http://a.com".
     * If there is no such '/', the whole URL is returned.
     *
     * The separator is located by searching for "://" rather than assuming
     * the scheme is exactly "http://", so "https://" URLs are split at the
     * correct position as well.
     */
    static string hostname(const string& url) {
        static const string separator = "://";
        const size_t sep = url.find(separator);
        const size_t first_slash = url.find('/');
        // "://" only marks a scheme when no '/' precedes it; otherwise it is
        // part of the path/query and the host starts at the beginning.
        const bool has_scheme = sep != string::npos && sep < first_slash;
        const size_t host_begin = has_scheme ? sep + separator.length() : 0;
        // find() yielding npos makes substr() return the entire string.
        return url.substr(0, url.find('/', host_begin));
    }
};