Class: Crawlscope::Sitemap

Inherits:
Object
  • Object
show all
Defined in:
lib/crawlscope/sitemap.rb

Constant Summary collapse

SITEMAP_NAMESPACE =
{"xmlns" => "http://www.sitemaps.org/schemas/sitemap/0.9"}.freeze

Instance Method Summary collapse

Constructor Details

#initialize(path:, adapter: nil, concurrency: Configuration::DEFAULT_CONCURRENCY, fetch_executor: Configuration::DEFAULT_FETCH_EXECUTOR, timeout_seconds: Configuration::DEFAULT_TIMEOUT_SECONDS) ⇒ Sitemap

Returns a new instance of Sitemap.



12
13
14
15
16
17
18
# File 'lib/crawlscope/sitemap.rb', line 12

# Builds a Sitemap by recording each keyword argument in the instance
# variable of the same name; no other work is done at construction time.
#
# @param path the starting location that #urls hands to collect_urls
# @param adapter optional collaborator, nil when omitted
#   (NOTE(review): its role is not visible in this section — confirm)
# @param concurrency defaults to Configuration::DEFAULT_CONCURRENCY
# @param fetch_executor defaults to Configuration::DEFAULT_FETCH_EXECUTOR
# @param timeout_seconds defaults to Configuration::DEFAULT_TIMEOUT_SECONDS
def initialize(
  path:,
  adapter: nil,
  concurrency: Configuration::DEFAULT_CONCURRENCY,
  fetch_executor: Configuration::DEFAULT_FETCH_EXECUTOR,
  timeout_seconds: Configuration::DEFAULT_TIMEOUT_SECONDS
)
  @path = path
  @adapter = adapter
  @concurrency = concurrency
  @fetch_executor = fetch_executor
  @timeout_seconds = timeout_seconds
end

Instance Method Details

#urls(base_url:) ⇒ Object



20
21
22
# File 'lib/crawlscope/sitemap.rb', line 20

# Collects URLs starting from @path and returns them with duplicates removed.
#
# A fresh Set and a fresh Mutex are created on every call and passed to
# collect_urls as its visited-tracking arguments, so no visited state is
# carried over between calls.
#
# @param base_url forwarded unchanged to collect_urls
# @return the result of collect_urls after calling uniq on it
#   (presumably an Array of URLs — collect_urls is defined outside this section)
def urls(base_url:)
  seen = Set.new
  seen_lock = Mutex.new
  discovered = collect_urls(@path, base_url: base_url, visited: seen, visited_mutex: seen_lock)
  discovered.uniq
end