spec/integration/app-search/crawler_urls_spec.rb (35 lines of code) (raw):
# Licensed to Elasticsearch B.V. under one or more contributor
# license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright
# ownership. Elasticsearch B.V. licenses this file to you under
# the Apache License, Version 2.0 (the "License"); you may
# not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
# frozen_string_literal: true
require_relative "#{__dir__}/app_search_helper.rb"
# Specs for the App Search crawler URL endpoints of the client: URL
# validation, content extraction and URL tracing.
#
# NOTE(review): `client` and `create_engine` are not defined in this file;
# presumably they are provided by app_search_helper.rb — confirm.
describe Elastic::EnterpriseSearch::AppSearch::Client do
  context 'Crawler URLs' do
    let(:engine_name) { 'crawler-urls' }
    let(:name) { 'https://www.elastic.co' }

    # Create the engine and register `name` as a crawler domain before each example.
    before do
      create_engine(engine_name)
      response = client.create_crawler_domain(engine_name, body: { name: name })
      # No example in this file reads @domain; kept in case shared helpers rely on it.
      @domain = response.body
    end

    # Remove the engine after each example.
    after do
      client.delete_engine(engine_name)
      # NOTE(review): presumably gives the server time to finish the deletion
      # before the next example recreates the engine — confirm.
      sleep 1
    end

    it 'validates a URL' do
      response = client.crawler_url_validation_result(engine_name, url: name)

      expect(response.status).to eq 200
      expect(response.body['url']).to eq name
      expect(response.body['valid']).to be true
    end

    it 'extracts content from a URL' do
      response = client.crawler_url_extraction_result(engine_name, url: name)

      expect(response.status).to eq 200
      # Compare the key set without depending on the order of keys in the parsed body.
      expect(response.body.keys).to match_array(%w[url normalized_url results])
    end

    it 'traces history for a crawler URL' do
      response = client.crawler_url_tracing_result(engine_name, url: name)

      expect(response.status).to eq 200
      expect(response.body['url']).to eq name
      # The expected normalized URL is `name` with a trailing slash.
      expect(response.body['normalized_url']).to eq "#{name}/"
      # A bare `expect(...)` without a matcher asserts nothing, so require the
      # field to actually be present in the response.
      expect(response.body['crawl_requests']).not_to be_nil
    end
  end
end