Skip to content
This repository was archived by the owner on Jun 13, 2023. It is now read-only.

Commit 25edcf9

Browse files
committed
Updates for webarchive-discovery 3.0.0 release.
1 parent bb1d9f1 commit 25edcf9

File tree

5 files changed: 11 additions and 14 deletions.

solr/conf/schema.xml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -28,7 +28,7 @@
2828

2929
<!-- BL UKWA: additional -->
3030
<field name="access_terms" type="string" indexed="true" docValues="true" multiValued="true"/>
31-
<field name="author" type="string" indexed="true" docValues="true"/>
31+
<field name="author" type="string" indexed="true" docValues="true" multiValued="true"/>
3232
<field name="category" type="text_general" indexed="true" stored="true"/>
3333
<field name="collection" type="string" indexed="true" docValues="true" multiValued="true"/>
3434
<field name="collections" type="string" indexed="true" docValues="true" multiValued="true"/>

solr/warclight_warc-indexer.conf

Lines changed: 7 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -4,21 +4,19 @@
44
"http_proxy": {},
55
"solr": {
66
"batch_size": 500,
7-
"num_shards": 1,
87
"dummy_run": false,
9-
"num_threads": 1,
108
"disablecommit": true,
119
"use_hash_url_id": true,
12-
"check_solr_for_duplicates": true,
10+
"check_solr_for_duplicates": false,
1311

1412
"field_setup": {
1513
"fields" : {
16-
"content" : { "max_length" : 512K },
17-
"generator": {"max_length" : 2048 },
18-
"links" : { "max_length" : 2048 },
19-
"links_hosts" : { "max_length" : 2048 },
2014
"url" : { "max_length" : 2048 },
2115
"url_norm" : { "max_length" : 2048 },
16+
"links" : { "max_length" : 2048 },
17+
"links_hosts" : { "max_length" : 2048 },
18+
"content" : { "max_length" : 512K },
19+
"generator": {"max_length" : 2048 },
2220
},
2321
},
2422
},
@@ -53,7 +51,7 @@
5351
"file": "/path/to/exclude.txt"
5452
},
5553
"extract": {
56-
"onDiskThreshold": "500M",
54+
"onDiskThreshold": "1024M",
5755
"response_include": [
5856
"1",
5957
"2",
@@ -74,7 +72,7 @@
7472
"response",
7573
"revisit"
7674
],
77-
"inMemoryThreshold": "500M",
75+
"inMemoryThreshold": "1024M",
7876
"content": {
7977
"text": true,
8078
"text_stored": true,
Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,2 +1 @@
1-
gem 'blacklight', github: 'projectblacklight/blacklight', branch: 'master'
2-
gem 'blacklight_range_limit', github: 'projectblacklight/blacklight_range_limit', branch: 'blacklight-7'
1+
gem 'blacklight_range_limit', '7.0.0.rc2'

tasks/warclight.rake

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -53,7 +53,7 @@ namespace :warclight do
5353
task :seed do
5454
puts 'Seeding index with data from spec/fixtures/warcs/...'
5555
# rubocop:disable Metrics/LineLength
56-
system('curl -o ".internal_test_gem/tmp/warc-indexer.jar" "http://alpha.library.yorku.ca/warc-indexer-3.0.0-SNAPSHOT-jar-with-dependencies.jar"')
56+
system('curl -o ".internal_test_gem/tmp/warc-indexer.jar" "http://alpha.library.yorku.ca/warc-indexer.jar"')
5757
system('java -Djava.io.tmpdir=.internal_test_gem/tmp -jar .internal_test_gem/tmp/warc-indexer.jar -c .internal_test_gem/solr/warclight_warc-indexer.conf -i "York University Libraries" -n "Test Collection" -u "12345" -s http://localhost:8983/solr/blacklight-core spec/fixtures/warcs/*.gz')
5858
system('curl "http://localhost:8983/solr/blacklight-core/update?commit=true&openSearcher=true"')
5959
end

warclight.gemspec

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -21,7 +21,7 @@ Gem::Specification.new do |s|
2121
s.executables = s.files.grep(%r{^exe/}) { |f| File.basename(f) }
2222
s.require_paths = ['lib']
2323

24-
s.add_dependency 'blacklight'
24+
s.add_dependency 'blacklight', '7.0.0.rc1'
2525
s.add_dependency 'rails', '~> 5.0'
2626

2727
s.add_development_dependency 'bundler', '~> 1.14'

0 commit comments

Comments
 (0)