diff --git a/app/graphql/types/query_type.rb b/app/graphql/types/query_type.rb index c0576f2..598213e 100644 --- a/app/graphql/types/query_type.rb +++ b/app/graphql/types/query_type.rb @@ -9,9 +9,18 @@ def ping 'Pong!' end - field :record_id, RecordType, null: false, - description: 'Retrieve one timdex record' do - argument :id, String, required: true + if Flipflop.v2? + field :record_id, RecordType, null: false, + description: 'Retrieve one timdex record' do + argument :id, String, required: true + argument :index, String, required: false, default_value: nil, + description: 'It is not recommended to provide an index value unless we have provided you with one for your specific use case' + end + else + field :record_id, RecordType, null: false, + description: 'Retrieve one timdex record' do + argument :id, String, required: true + end end if Flipflop.v2? @@ -26,8 +35,8 @@ def info end if Flipflop.v2? - def record_id(id:) - result = Retrieve.new.fetch(id, Timdex::OSClient) + def record_id(id:, index:) + result = Retrieve.new.fetch(id, Timdex::OSClient, index) result['hits']['hits'].first['_source'] rescue Elasticsearch::Transport::Transport::Errors::NotFound raise GraphQL::ExecutionError, "Record '#{id}' not found" @@ -44,6 +53,8 @@ def record_id(id:) argument :subjects, String, required: false, default_value: nil argument :title, String, required: false, default_value: nil argument :from, String, required: false, default_value: '0' + argument :index, String, required: false, default_value: nil, + description: 'It is not recommended to provide an index value unless we have provided you with one for your specific use case' # applied facets argument :collection_facet, [String], required: false, default_value: nil @@ -81,11 +92,11 @@ def record_id(id:) if Flipflop.v2? def search(searchterm:, citation:, contributors:, funding_information:, identifiers:, locations:, subjects:, - title:, from:, **facets) + title:, index:, from:, **facets) query = construct_query(searchterm, citation, contributors, funding_information, identifiers, locations, subjects, title, facets) - results = Opensearch.new.search(from, query, Timdex::OSClient) + results = Opensearch.new.search(from, query, Timdex::OSClient, index) response = {} response[:hits] = results['hits']['total']['value'] diff --git a/app/models/opensearch.rb b/app/models/opensearch.rb index e9c74c3..cd32117 100644 --- a/app/models/opensearch.rb +++ b/app/models/opensearch.rb @@ -2,12 +2,17 @@ class Opensearch SIZE = 20 MAX_PAGE = 200 - def search(from, params, client) + def search(from, params, client, index = nil) @params = params - client.search(index: ENV.fetch('ELASTICSEARCH_INDEX', nil), + index = default_index unless index.present? + client.search(index: index, body: build_query(from)) end + def default_index + ENV.fetch('ELASTICSEARCH_INDEX', nil) + end + # Construct the json query to send to elasticsearch def build_query(from) { diff --git a/app/models/retrieve.rb b/app/models/retrieve.rb index a882c53..5778cad 100644 --- a/app/models/retrieve.rb +++ b/app/models/retrieve.rb @@ -1,17 +1,24 @@ class Retrieve - def fetch(id, client) + def fetch(id, client, index = nil) f = to_filter(id) - record = client.search(index: ENV['ELASTICSEARCH_INDEX'], body: f) + + index = default_index unless index.present? + + record = client.search(index: index, body: f) if client.instance_of?(OpenSearch::Client) raise OpenSearch::Transport::Transport::Errors::NotFound if record['hits']['total']['value'].zero? - else - raise Elasticsearch::Transport::Transport::Errors::NotFound if record['hits']['total'].zero? + elsif record['hits']['total'].zero? + raise Elasticsearch::Transport::Transport::Errors::NotFound end record end + def default_index + ENV.fetch('ELASTICSEARCH_INDEX', nil) + end + def to_filter(id) { query: { diff --git a/test/controllers/graphql_controller_v2_test.rb b/test/controllers/graphql_controller_v2_test.rb index d47fecb..b31df6d 100644 --- a/test/controllers/graphql_controller_v2_test.rb +++ b/test/controllers/graphql_controller_v2_test.rb @@ -153,7 +153,7 @@ def setup }' } assert_equal(200, response.status) json = JSON.parse(response.body) - assert json['data']['search']['records'].first['contributors'].any? { |c| c.has_value? 'Moon, Intae' } + assert json['data']['search']['records'].first['contributors'].any? { |c| c.value? 'Moon, Intae' } end end @@ -177,9 +177,9 @@ def setup assert_equal 'A common table : 80 recipes and stories from my shared cultures /', json['data']['search']['records'].first['title'] assert json['data']['search']['records'].first['contributors'].any? { |c| - c.has_value? 'McTernan, Cynthia Chen, author.' + c.value? 'McTernan, Cynthia Chen, author.' } - assert json['data']['search']['records'].first['identifiers'].any? { |i| i.has_value? '163565002X (hardback)' } + assert json['data']['search']['records'].first['identifiers'].any? { |i| i.value? '163565002X (hardback)' } end end @@ -317,7 +317,6 @@ def setup test 'graphqlv2 filter multiple sources' do VCR.use_cassette('graphql v2 filter multiple sources') do - # no filters to return all sources. used later to test filters return less than the total. post '/graphql', params: { query: '{ @@ -330,8 +329,7 @@ def setup } } } - }' - } + }' } json = JSON.parse(response.body) initial_source_array = json['data']['search']['aggregations']['source'] @@ -348,8 +346,7 @@ def setup } } } - }' - } + }' } assert_equal(200, response.status) json = JSON.parse(response.body) @@ -359,14 +356,13 @@ def setup assert_equal(2, filtered_source_array.count) expected_sources = ['zenodo', 'dspace@mit'] - actual_sources = filtered_source_array.map{|source| source["key"]} + actual_sources = filtered_source_array.map { |source| source['key'] } assert_equal(expected_sources, actual_sources) end end test 'graphqlv2 filter single source' do VCR.use_cassette('graphql v2 filter single source') do - # no filters to return all sources. used later to test filters return less than the total. post '/graphql', params: { query: '{ @@ -379,8 +375,7 @@ def setup } } } - }' - } + }' } json = JSON.parse(response.body) initial_source_array = json['data']['search']['aggregations']['source'] @@ -397,8 +392,7 @@ def setup } } } - }' - } + }' } assert_equal(200, response.status) json = JSON.parse(response.body) @@ -408,8 +402,40 @@ def setup assert_equal(1, filtered_source_array.count) expected_sources = ['dspace@mit'] - actual_sources = filtered_source_array.map{|source| source["key"]} + actual_sources = filtered_source_array.map { |source| source['key'] } assert_equal(expected_sources, actual_sources) end end + + test 'graphqlv2 can retrieve a record from a default index' do + # fragile test: specific item expected in default index + VCR.use_cassette('graphql v2 retrieve from default index') do + post '/graphql', params: { query: + '{ + recordId(id: "dspace:1721.1-44968") { + timdexRecordId + title + } + }' } + + json = JSON.parse(response.body) + assert_equal('dspace:1721.1-44968', json['data']['recordId']['timdexRecordId']) + end + end + + test 'graphqlv2 can retrive a record from a specified index' do + # fragile test: specific item expected in specified index + VCR.use_cassette('graphql v2 retrieve from rdi* index') do + post '/graphql', params: { query: + '{ + recordId(id: "zenodo:5728409", index: "rdi*") { + timdexRecordId + title + } + }' } + + json = JSON.parse(response.body) + assert_equal('zenodo:5728409', json['data']['recordId']['timdexRecordId']) + end + end end diff --git a/test/models/opensearch_test.rb b/test/models/opensearch_test.rb index 55f5311..e08013f 100644 --- a/test/models/opensearch_test.rb +++ b/test/models/opensearch_test.rb @@ -59,6 +59,26 @@ class OpensearchTest < ActiveSupport::TestCase assert matches.select { |m| m['subjects.value'] == 'assured' } end + test 'can override index' do + # fragile test: assumes opensearch instance with at least one index prefixed with `rdi` + VCR.use_cassette('opensearch non-default index') do + params = { title: 'data' } + results = Opensearch.new.search(0, params, Timdex::OSClient, 'rdi*') + assert results['hits']['hits'].map { |hit| hit['_index'] }.uniq.map { |index| index.start_with?('rdi') }.any? + end + end + + test 'default index' do + # fragile test: assumes opensearch instance with at least one index promoted to timdex-prod and no promoted indexes + # that start with rdi* + VCR.use_cassette('opensearch default index') do + params = { title: 'data' } + results = Opensearch.new.search(0, params, Timdex::OSClient) + refute results['hits']['hits'].map { |hit| hit['_index'] }.uniq.map { |index| index.start_with?('rdi') }.any? + assert results['hits']['hits'].map { |hit| hit['_index'] }.uniq.any? + end + end + test 'searches a single field' do VCR.use_cassette('opensearch single field') do params = { title: 'spice' } diff --git a/test/vcr_cassettes/graphql_v2_retrieve_from_default_index.yml b/test/vcr_cassettes/graphql_v2_retrieve_from_default_index.yml new file mode 100644 index 0000000..1f0d3c7 --- /dev/null +++ b/test/vcr_cassettes/graphql_v2_retrieve_from_default_index.yml @@ -0,0 +1,96 @@ +--- +http_interactions: +- request: + method: get + uri: http://localhost:9200/ + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - 'opensearch-ruby/2.0.0 (RUBY_VERSION: 2.7.6; darwin x86_64; Faraday v1.10.0)' + Content-Type: + - application/json + Accept-Encoding: + - gzip;q=1.0,deflate;q=0.6,identity;q=0.3 + Accept: + - "*/*" + response: + status: + code: 200 + message: OK + headers: + Content-Type: + - application/json; charset=UTF-8 + Content-Length: + - '350' + body: + encoding: ASCII-8BIT + string: | + { + "name" : "e03207b01655", + "cluster_name" : "docker-cluster", + "cluster_uuid" : "9OY_6pKWQKWHQbxorP7qaw", + "version" : { + "distribution" : "opensearch", + "number" : "1.3.0", + "build_type" : "tar", + "build_hash" : "e45991597c86ba1bbcc36ee1dfdc165197a913af", + "build_date" : "2022-03-15T19:07:30.455415Z", + "build_snapshot" : false, + "lucene_version" : "8.10.1", + "minimum_wire_compatibility_version" : "6.8.0", + "minimum_index_compatibility_version" : "6.0.0-beta1" + }, + "tagline" : "The OpenSearch Project: https://opensearch.org/" + } + recorded_at: Wed, 13 Jul 2022 20:10:38 GMT +- request: + method: post + uri: http://localhost:9200/timdex-prod/_search + body: + encoding: UTF-8 + string: '{"query":{"ids":{"values":["dspace:1721.1-44968"]}}}' + headers: + User-Agent: + - 'opensearch-ruby/2.0.0 (RUBY_VERSION: 2.7.6; darwin x86_64; Faraday v1.10.0)' + Content-Type: + - application/json + Accept-Encoding: + - gzip;q=1.0,deflate;q=0.6,identity;q=0.3 + Accept: + - "*/*" + response: + status: + code: 200 + message: OK + headers: + Content-Type: + - application/json; charset=UTF-8 + Content-Length: + - '1037' + body: + encoding: ASCII-8BIT + string: '{"took":3,"timed_out":false,"_shards":{"total":1,"successful":1,"skipped":0,"failed":0},"hits":{"total":{"value":1,"relation":"eq"},"max_score":1.0,"hits":[{"_index":"dspace-2022-07-13t19-23-43z","_type":"_doc","_id":"dspace:1721.1-44968","_score":1.0,"_source":{"citation":"Stoker, + Thomas M. (2000): Panel data analysis of U.S. coal productivity. MIT Center + for Energy and Environmental Policy Research. Working Paper. https://dspace.mit.edu/handle/1721.1/44968","content_type":["Working + Paper"],"contributors":[{"kind":"author","value":"Stoker, Thomas M."},{"kind":"other","value":"Massachusetts + Institute of Technology. Center for Energy and Environmental Policy Research."}],"dates":[{"kind":"Publication + date","value":"2000"}],"file_formats":["application/pdf"],"format":"electronic + resource","identifiers":[{"kind":"uri","value":"http://hdl.handle.net/1721.1/44968"},{"kind":"oclc","value":"52315985"}],"links":[{"kind":"Digital + object URL","text":"Digital object URL","url":"http://hdl.handle.net/1721.1/44968"}],"numbering":"MIT-CEEPR + (Series) ; 00-004WP.","publication_information":["MIT Center for Energy and + Environmental Policy Research"],"source":"DSpace@MIT","source_link":"https://dspace.mit.edu/handle/1721.1/44968","summary":["We + analyze labor productivity in coal mining in the United States using indices + of productivity change associated with the concepts of panel data modeling. + This approach is valuable when there is extensive heterogeneity in production + units, as with coal mines. We find substantial returns to scale for coal mining + in all geographical regions, and find that smooth technical progress is exhibited + by estimates of the fixed effects for coal mining. We carry out a variety + of diagnostic analyses of our basic model and primary modeling assumptions, + using recently proposed methods for addressing ''errors-in-variable'' and + ''weak instrument bias'' problems, as well a new method for studying errors-in-variables + in nonlinear contexts."],"timdex_record_id":"dspace:1721.1-44968","title":"Panel + data analysis of U.S. coal productivity"}}]}}' + recorded_at: Wed, 13 Jul 2022 20:10:39 GMT +recorded_with: VCR 6.1.0 diff --git a/test/vcr_cassettes/graphql_v2_retrieve_from_rdi_index.yml b/test/vcr_cassettes/graphql_v2_retrieve_from_rdi_index.yml new file mode 100644 index 0000000..366efac --- /dev/null +++ b/test/vcr_cassettes/graphql_v2_retrieve_from_rdi_index.yml @@ -0,0 +1,93 @@ +--- +http_interactions: +- request: + method: get + uri: http://localhost:9200/ + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - 'opensearch-ruby/2.0.0 (RUBY_VERSION: 2.7.6; darwin x86_64; Faraday v1.10.0)' + Content-Type: + - application/json + Accept-Encoding: + - gzip;q=1.0,deflate;q=0.6,identity;q=0.3 + Accept: + - "*/*" + response: + status: + code: 200 + message: OK + headers: + Content-Type: + - application/json; charset=UTF-8 + Content-Length: + - '350' + body: + encoding: ASCII-8BIT + string: | + { + "name" : "e03207b01655", + "cluster_name" : "docker-cluster", + "cluster_uuid" : "9OY_6pKWQKWHQbxorP7qaw", + "version" : { + "distribution" : "opensearch", + "number" : "1.3.0", + "build_type" : "tar", + "build_hash" : "e45991597c86ba1bbcc36ee1dfdc165197a913af", + "build_date" : "2022-03-15T19:07:30.455415Z", + "build_snapshot" : false, + "lucene_version" : "8.10.1", + "minimum_wire_compatibility_version" : "6.8.0", + "minimum_index_compatibility_version" : "6.0.0-beta1" + }, + "tagline" : "The OpenSearch Project: https://opensearch.org/" + } + recorded_at: Wed, 13 Jul 2022 20:14:01 GMT +- request: + method: post + uri: http://localhost:9200/rdi*/_search + body: + encoding: UTF-8 + string: '{"query":{"ids":{"values":["zenodo:5728409"]}}}' + headers: + User-Agent: + - 'opensearch-ruby/2.0.0 (RUBY_VERSION: 2.7.6; darwin x86_64; Faraday v1.10.0)' + Content-Type: + - application/json + Accept-Encoding: + - gzip;q=1.0,deflate;q=0.6,identity;q=0.3 + Accept: + - "*/*" + response: + status: + code: 200 + message: OK + headers: + Content-Type: + - application/json; charset=UTF-8 + Content-Length: + - '1184' + body: + encoding: ASCII-8BIT + string: '{"took":2,"timed_out":false,"_shards":{"total":3,"successful":3,"skipped":0,"failed":0},"hits":{"total":{"value":1,"relation":"eq"},"max_score":1.0,"hits":[{"_index":"rdizenodo-2022-07-13t19-23-57z","_type":"_doc","_id":"zenodo:5728409","_score":1.0,"_source":{"citation":"Stevens, + Abigail (2021): Data for time series tutorial. Zenodo. Dataset. https://zenodo.org/record/5728409","content_type":["Dataset"],"contributors":[{"affiliation":["Michigan + State Univ. and Univ. of Michigan"],"kind":"Creator","identifier":["https://orcid.org/0000-0002-5041-3079"],"value":"Stevens, + Abigail"}],"dates":[{"kind":"Publication date","value":"2021"},{"kind":"Issued","value":"2021-11-25"}],"format":"electronic + resource","identifiers":[{"kind":"DOI","value":"10.5281/zenodo.5728409"},{"kind":"url","value":"https://zenodo.org/record/5728409"}],"languages":["en"],"notes":[{"kind":"Other","value":["{\"references\": + [\"Wilson-Hodge, C. et al. (2018). \\\"NICER and Fermi GBM Observations of + the First Galactic Ultraluminous X-Ray Pulsar Swift J0243.6+6124,\\\" ApJ, + 863, 9.\", \"Stevens, A.L. et al. (2018). \\\" A NICER Discovery of a Low-frequency + Quasi-periodic Oscillation in the Soft-intermediate State of MAXI J1535-571,\\\" + ApJ, 865, L15.\"]}"]}],"publication_information":["Zenodo"],"related_items":[{"relationship":"IsVersionOf","uri":"https://doi.org/10.5281/zenodo.5728408"},{"relationship":"IsPartOf","uri":"https://zenodo.org/communities/astronomy-general"}],"rights":[{"uri":"https://creativecommons.org/licenses/by/4.0/legalcode"},{"uri":"info:eu-repo/semantics/openAccess"}],"source":"Zenodo","source_link":"https://zenodo.org/record/5728409","subjects":[{"kind":"Subject + scheme not provided","value":["astronomy"]}],"summary":["\u003cp\u003eThese + are sample data files to be used in the time series tutorial found here: \u003ca + href=\"https://github.com/abigailStev/timeseries-tutorial\"\u003ehttps://github.com/abigailStev/timeseries-tutorial + \u003c/a\u003e\u003c/p\u003e\n\n\u003cp\u003eThey are public datasets from + the NICER X-ray Timing Instrument of a black hole, MAXI J1535-571, and a neutron + star, Swift J0243.6+6124. There are also Good Time Intervals I created for + each of the photon event lists.\u003c/p\u003e"],"timdex_record_id":"zenodo:5728409","title":"Data + for time series tutorial"}}]}}' + recorded_at: Wed, 13 Jul 2022 20:14:01 GMT +recorded_with: VCR 6.1.0 diff --git a/test/vcr_cassettes/opensearch_default_index.yml b/test/vcr_cassettes/opensearch_default_index.yml new file mode 100644 index 0000000..15df5ed --- /dev/null +++ b/test/vcr_cassettes/opensearch_default_index.yml @@ -0,0 +1,152 @@ +--- +http_interactions: +- request: + method: get + uri: http://localhost:9200/ + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - 'opensearch-ruby/2.0.0 (RUBY_VERSION: 2.7.6; darwin x86_64; Faraday v1.10.0)' + Content-Type: + - application/json + Accept-Encoding: + - gzip;q=1.0,deflate;q=0.6,identity;q=0.3 + Accept: + - "*/*" + response: + status: + code: 200 + message: OK + headers: + Content-Type: + - application/json; charset=UTF-8 + Content-Length: + - '350' + body: + encoding: ASCII-8BIT + string: | + { + "name" : "e03207b01655", + "cluster_name" : "docker-cluster", + "cluster_uuid" : "9OY_6pKWQKWHQbxorP7qaw", + "version" : { + "distribution" : "opensearch", + "number" : "1.3.0", + "build_type" : "tar", + "build_hash" : "e45991597c86ba1bbcc36ee1dfdc165197a913af", + "build_date" : "2022-03-15T19:07:30.455415Z", + "build_snapshot" : false, + "lucene_version" : "8.10.1", + "minimum_wire_compatibility_version" : "6.8.0", + "minimum_index_compatibility_version" : "6.0.0-beta1" + }, + "tagline" : "The OpenSearch Project: https://opensearch.org/" + } + recorded_at: Wed, 13 Jul 2022 19:47:35 GMT +- request: + method: post + uri: http://localhost:9200/timdex-prod/_search + body: + encoding: UTF-8 + string: '{"from":0,"size":20,"query":{"bool":{"should":null,"must":[{"match":{"title":"data"}}],"filter":[]}},"highlight":{"pre_tags":["\u003cspan + class=\"highlight\"\u003e"],"post_tags":["\u003c/span\u003e"],"fields":{"*":{}}},"aggregations":{"collections":{"terms":{"field":"collections.keyword"}},"contributors":{"nested":{"path":"contributors"},"aggs":{"contributor_names":{"terms":{"field":"contributors.value.keyword"}}}},"content_type":{"terms":{"field":"content_type"}},"content_format":{"terms":{"field":"format"}},"languages":{"terms":{"field":"languages.keyword"}},"literary_form":{"terms":{"field":"literary_form"}},"source":{"terms":{"field":"source"}},"subjects":{"nested":{"path":"subjects"},"aggs":{"subject_names":{"terms":{"field":"subjects.value.keyword"}}}}}}' + headers: + User-Agent: + - 'opensearch-ruby/2.0.0 (RUBY_VERSION: 2.7.6; darwin x86_64; Faraday v1.10.0)' + Content-Type: + - application/json + Accept-Encoding: + - gzip;q=1.0,deflate;q=0.6,identity;q=0.3 + Accept: + - "*/*" + response: + status: + code: 200 + message: OK + headers: + Content-Type: + - application/json; charset=UTF-8 + Content-Length: + - '2381' + body: + encoding: ASCII-8BIT + string: '{"took":8,"timed_out":false,"_shards":{"total":1,"successful":1,"skipped":0,"failed":0},"hits":{"total":{"value":3,"relation":"eq"},"max_score":5.2164545,"hits":[{"_index":"dspace-2022-07-13t19-23-43z","_type":"_doc","_id":"dspace:1721.1-44968","_score":5.2164545,"_source":{"citation":"Stoker, + Thomas M. (2000): Panel data analysis of U.S. coal productivity. MIT Center + for Energy and Environmental Policy Research. Working Paper. https://dspace.mit.edu/handle/1721.1/44968","content_type":["Working + Paper"],"contributors":[{"kind":"author","value":"Stoker, Thomas M."},{"kind":"other","value":"Massachusetts + Institute of Technology. Center for Energy and Environmental Policy Research."}],"dates":[{"kind":"Publication + date","value":"2000"}],"file_formats":["application/pdf"],"format":"electronic + resource","identifiers":[{"kind":"uri","value":"http://hdl.handle.net/1721.1/44968"},{"kind":"oclc","value":"52315985"}],"links":[{"kind":"Digital + object URL","text":"Digital object URL","url":"http://hdl.handle.net/1721.1/44968"}],"numbering":"MIT-CEEPR + (Series) ; 00-004WP.","publication_information":["MIT Center for Energy and + Environmental Policy Research"],"source":"DSpace@MIT","source_link":"https://dspace.mit.edu/handle/1721.1/44968","summary":["We + analyze labor productivity in coal mining in the United States using indices + of productivity change associated with the concepts of panel data modeling. + This approach is valuable when there is extensive heterogeneity in production + units, as with coal mines. We find substantial returns to scale for coal mining + in all geographical regions, and find that smooth technical progress is exhibited + by estimates of the fixed effects for coal mining. We carry out a variety + of diagnostic analyses of our basic model and primary modeling assumptions, + using recently proposed methods for addressing ''errors-in-variable'' and + ''weak instrument bias'' problems, as well a new method for studying errors-in-variables + in nonlinear contexts."],"timdex_record_id":"dspace:1721.1-44968","title":"Panel + data analysis of U.S. coal productivity"},"highlight":{"title":["Panel data analysis of U.S. coal productivity"]}},{"_index":"dspace-2022-07-13t19-23-43z","_type":"_doc","_id":"dspace:1721.1-45062","_score":3.5745273,"_source":{"citation":"Ellerman, + A. Denny, Buchner, Barbara (2006): Over-allocation or abatement? : a preliminary + analysis of the EU ETS based on the 2005 emission data. MIT Center for Energy + and Environmental Policy Research. Working Paper. https://dspace.mit.edu/handle/1721.1/45062","content_type":["Working + Paper"],"contributors":[{"kind":"author","value":"Ellerman, A. Denny"},{"kind":"author","value":"Buchner, + Barbara"},{"kind":"other","value":"Massachusetts Institute of Technology. + Center for Energy and Environmental Policy Research."}],"dates":[{"kind":"Publication + date","value":"2006"}],"file_formats":["application/pdf"],"format":"electronic + resource","identifiers":[{"kind":"uri","value":"http://hdl.handle.net/1721.1/45062"},{"kind":"oclc","value":"159935161"}],"links":[{"kind":"Digital + object URL","text":"Digital object URL","url":"http://hdl.handle.net/1721.1/45062"}],"numbering":"MIT-CEEPR + (Series) ; 06-016WP.","publication_information":["MIT Center for Energy and + Environmental Policy Research"],"source":"DSpace@MIT","source_link":"https://dspace.mit.edu/handle/1721.1/45062","summary":["This + paper provides an initial analysis of the EU ETS based on the installation-level + data for verified emissions and allowance allocations in the first trading + year. Those data, released on May 15, 2006, and subsequent updates revealed + that CO2 emissions were about 4% lower than the allocated allowances. The + main objective of the paper is to shed light on the extent to which over-allocation + and abatement have taken place in 2005. We propose a measure by which over-allocation + can be judged and provide estimates of abatement based on emissions data and + indicators of economic activity as well as trends in energy and carbon intensity. + Finally, we discuss the insights and implications that emerge from this tentative + assessment."],"timdex_record_id":"dspace:1721.1-45062","title":"Over-allocation + or abatement? : a preliminary analysis of the EU ETS based on the 2005 emission + data"},"highlight":{"title":[": a preliminary analysis of the EU ETS based + on the 2005 emission data"]}},{"_index":"dspace-2022-07-13t19-23-43z","_type":"_doc","_id":"dspace:1721.1-44986","_score":3.5745273,"_source":{"citation":"Gupta, + Shreekant (2002): Environmental benefits and cost savings through market-based + instruments : an application using state-level data from India. MIT Center + for Energy and Environmental Policy Research. Working Paper. https://dspace.mit.edu/handle/1721.1/44986","content_type":["Working + Paper"],"contributors":[{"kind":"author","value":"Gupta, Shreekant"},{"kind":"other","value":"Massachusetts + Institute of Technology. Center for Energy and Environmental Policy Research."}],"dates":[{"kind":"Publication + date","value":"2002"}],"file_formats":["application/pdf"],"format":"electronic + resource","identifiers":[{"kind":"uri","value":"http://hdl.handle.net/1721.1/44986"},{"kind":"oclc","value":"52305223"}],"links":[{"kind":"Digital + object URL","text":"Digital object URL","url":"http://hdl.handle.net/1721.1/44986"}],"numbering":"MIT-CEEPR + (Series) ; 02-005WP.","publication_information":["MIT Center for Energy and + Environmental Policy Research"],"source":"DSpace@MIT","source_link":"https://dspace.mit.edu/handle/1721.1/44986","summary":["This + paper develops a methodology for estimating potential cost savings from the + use of market-based instruments (MBIs) when local emissions and abatement + cost data are not available. The paper provides estimates of the cost savings + for a 50% reduction of particulate emissions in India''s five main industrial + states, as well as estimates of the benefits from doing so. The estimates + are developed by applying World Bank particulate intensity and abatement cost + factors to sectoral output data. The estimated costs savings range from 26% + to 169% and the benefits are many times greater than the costs even without + the use of MBIs. The paper concludes by commenting on the relative difficulty + of implementing reductions by market-based instruments and conventional command-and-control + regulations."],"timdex_record_id":"dspace:1721.1-44986","title":"Environmental + benefits and cost savings through market-based instruments : an application + using state-level data from India"},"highlight":{"title":["Environmental benefits + and cost savings through market-based instruments : an application using state-level + data"]}}]},"aggregations":{"languages":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[]},"content_type":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[{"key":"working + paper","doc_count":3}]},"collections":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[]},"subjects":{"doc_count":0,"subject_names":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[]}},"content_format":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[{"key":"electronic + resource","doc_count":3}]},"literary_form":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[]},"source":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[{"key":"dspace@mit","doc_count":3}]},"contributors":{"doc_count":7,"contributor_names":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[{"key":"massachusetts + institute of technology. center for energy and environmental policy research.","doc_count":3},{"key":"buchner, + barbara","doc_count":1},{"key":"ellerman, a. denny","doc_count":1},{"key":"gupta, + shreekant","doc_count":1},{"key":"stoker, thomas m.","doc_count":1}]}}}}' + recorded_at: Wed, 13 Jul 2022 19:47:35 GMT +recorded_with: VCR 6.1.0 diff --git a/test/vcr_cassettes/opensearch_non-default_index.yml b/test/vcr_cassettes/opensearch_non-default_index.yml new file mode 100644 index 0000000..d36925d --- /dev/null +++ b/test/vcr_cassettes/opensearch_non-default_index.yml @@ -0,0 +1,78 @@ +--- +http_interactions: +- request: + method: get + uri: http://localhost:9200/ + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - 'opensearch-ruby/2.0.0 (RUBY_VERSION: 2.7.6; darwin x86_64; Faraday v1.10.0)' + Content-Type: + - application/json + Accept-Encoding: + - gzip;q=1.0,deflate;q=0.6,identity;q=0.3 + Accept: + - "*/*" + response: + status: + code: 200 + message: OK + headers: + Content-Type: + - application/json; charset=UTF-8 + Content-Length: + - '350' + body: + encoding: ASCII-8BIT + string: | + { + "name" : "e03207b01655", + "cluster_name" : "docker-cluster", + "cluster_uuid" : "9OY_6pKWQKWHQbxorP7qaw", + "version" : { + "distribution" : "opensearch", + "number" : "1.3.0", + "build_type" : "tar", + "build_hash" : "e45991597c86ba1bbcc36ee1dfdc165197a913af", + "build_date" : "2022-03-15T19:07:30.455415Z", + "build_snapshot" : false, + "lucene_version" : "8.10.1", + "minimum_wire_compatibility_version" : "6.8.0", + "minimum_index_compatibility_version" : "6.0.0-beta1" + }, + "tagline" : "The OpenSearch Project: https://opensearch.org/" + } + recorded_at: Wed, 13 Jul 2022 19:37:49 GMT +- request: + method: post + uri: http://localhost:9200/rdi*/_search + body: + encoding: UTF-8 + string: '{"from":0,"size":20,"query":{"bool":{"should":null,"must":[{"match":{"title":"data"}}],"filter":[]}},"highlight":{"pre_tags":["\u003cspan + class=\"highlight\"\u003e"],"post_tags":["\u003c/span\u003e"],"fields":{"*":{}}},"aggregations":{"collections":{"terms":{"field":"collections.keyword"}},"contributors":{"nested":{"path":"contributors"},"aggs":{"contributor_names":{"terms":{"field":"contributors.value.keyword"}}}},"content_type":{"terms":{"field":"content_type"}},"content_format":{"terms":{"field":"format"}},"languages":{"terms":{"field":"languages.keyword"}},"literary_form":{"terms":{"field":"literary_form"}},"source":{"terms":{"field":"source"}},"subjects":{"nested":{"path":"subjects"},"aggs":{"subject_names":{"terms":{"field":"subjects.value.keyword"}}}}}}' + headers: + User-Agent: + - 'opensearch-ruby/2.0.0 (RUBY_VERSION: 2.7.6; darwin x86_64; Faraday v1.10.0)' + Content-Type: + - application/json + Accept-Encoding: + - gzip;q=1.0,deflate;q=0.6,identity;q=0.3 + Accept: + - "*/*" + response: + status: + code: 200 + message: OK + headers: + Content-Type: + - application/json; charset=UTF-8 + Content-Length: + - '21415' + body: + encoding: ASCII-8BIT + string: !binary |- + {"took":14,"timed_out":false,"_shards":{"total":3,"successful":3,"skipped":0,"failed":0},"hits":{"total":{"value":127,"relation":"eq"},"max_score":3.6222847,"hits":[{"_index":"rdiwhoas-2022-07-13t19-24-52z","_type":"_doc","_id":"whoas:1912-2338","_score":3.6222847,"_source":{"citation":"Environmental Science \u0026 Technology  42 (2008): 5688-5693","content_type":["Article"],"contributors":[{"kind":"author","value":"Ackerman, Katherine V."},{"kind":"author","value":"Sundquist, Eric T."}],"dates":[{"kind":"accessioned","value":"2008-08-20T14:51:14Z"},{"kind":"available","value":"2008-08-20T14:51:14Z"},{"kind":"Publication date","value":"2008-06-25"}],"file_formats":["application/pdf"],"format":"electronic resource","funding_information":[{"funder_name":"This study was supported by the National Research Program\r\nand the Earth System Dynamics Program of the U.S.\r\nGeological Survey."}],"identifiers":[{"kind":"uri","value":"https://hdl.handle.net/1912/2338"},{"kind":"doi","value":"10.1021/es800221q"}],"languages":["en_US"],"links":[{"kind":"Digital object URL","text":"Digital object URL","url":"https://hdl.handle.net/1912/2338"}],"notes":[{"value":["This paper is not subject to U.S. copyright.  The definitive version was published in Environmental Science \u0026 Technology  42 (2008): 5688-5693, doi:10.1021/es800221q."]}],"publication_information":["Americal Chemical Society"],"related_items":[{"uri":"https://doi.org/10.1021/es800221q"}],"source":"Woods Hole Open Access Server","source_link":"https://darchive.mblwhoilibrary.org/handle/1912/2338","summary":["Estimates of fossil-fuel CO2 emissions are needed to address a variety of climate-change mitigation concerns over a broad range of spatial and temporal scales. We compared two data sets that report power-plant CO2 emissions in the conterminous U.S. for 2004, the most recent year reported in both data sets. The data sets were obtained from the Department of Energy’s Energy Information Administration (EIA) and the Environmental Protection Agency’s eGRID database. Conterminous U.S. total emissions computed from the data sets differed by 3.5% for total plant emissions (electricity plus useful thermal output) and 2.3% for electricity generation only. These differences are well within previous estimates of uncertainty in annual U.S. fossil-fuel emissions. However, the corresponding average absolute differences between estimates of emissions from individual power plants were much larger, 16.9% and 25.3%, respectively. By statistical analysis, we identified several potential sources of differences between EIA and eGRID estimates for individual plants. Estimates that are based partly or entirely on monitoring of stack gases (reported by eGRID only) differed significantly from estimates based on fuel consumption (as reported by EIA). Differences in accounting methods appear to explain differences in estimates for emissions from electricity generation from combined heat and power plants, and for total and electricity generation emissions from plants that burn nonconventional fuels (e.g., biomass). Our analysis suggests the need for care in utilizing emissions data from individual power plants, and the need for transparency in documenting the accounting and monitoring methods used to estimate emissions."],"timdex_record_id":"whoas:1912-2338","title":"Comparison of two U.S. power-plant carbon dioxide emissions data sets"},"highlight":{"title":["Comparison of two U.S. power-plant carbon dioxide emissions <span class=\"highlight\">data</span> sets"]}},{"_index":"rdiwhoas-2022-07-13t19-24-52z","_type":"_doc","_id":"whoas:1912-24879","_score":3.6222847,"_source":{"citation":"Farris, A. S., Defne, Z., \u0026 Ganju, N. K. (2019). Identifying salt marsh shorelines from remotely sensed elevation data and imagery. Remote Sensing, 11(15), 1795.","content_type":["Article"],"contributors":[{"kind":"author","value":"Farris, Amy S."},{"kind":"author","value":"Defne, Zafer"},{"kind":"author","value":"Ganju, Neil K."}],"dates":[{"kind":"accessioned","value":"2019-11-21T20:32:16Z"},{"kind":"available","value":"2019-11-21T20:32:16Z"},{"kind":"Publication date","value":"2019-07-31"}],"format":"electronic resource","funding_information":[{"funder_name":"This project was supported by the U.S. Geological Survey (USGS) Coastal/Marine Natural Hazards and Resources Program as well as the Massachusetts O ce of Coastal Zone Management under interagency agreement 16ENMALQ006000."}],"identifiers":[{"kind":"uri","value":"https://hdl.handle.net/1912/24879"},{"kind":"doi","value":"10.3390/rs11151795"}],"links":[{"kind":"Digital object URL","text":"Digital object URL","url":"https://hdl.handle.net/1912/24879"}],"notes":[{"value":["© The Author(s), 2019. This article is distributed under the terms of the Creative Commons Attribution License. The definitive version was published in Farris, A. S., Defne, Z., \u0026 Ganju, N. K. Identifying salt marsh shorelines from remotely sensed elevation data and imagery. Remote Sensing, 11(15), (2019): 1795, doi: 10.3390/rs11151795."]}],"publication_information":["MDPI"],"related_items":[{"uri":"https://doi.org/10.3390/rs11151795"}],"rights":[{},{"uri":"http://creativecommons.org/licenses/by/4.0/"}],"source":"Woods Hole Open Access Server","source_link":"https://darchive.mblwhoilibrary.org/handle/1912/24879","subjects":[{"kind":"Subject scheme not provided","value":["marsh edge","marsh shoreline","unmanned aircraft system","UAS","UAV","drone","lidar","salt marsh","coastal wetlands","Plum Island"]}],"summary":["Salt marshes are valuable ecosystems that are vulnerable to lateral erosion, submergence, and internal disintegration due to sea level rise, storms, and sediment deficits. Because many salt marshes are losing area in response to these factors, it is important to monitor their lateral extent at high resolution over multiple timescales. In this study we describe two methods to calculate the location of the salt marsh shoreline. The marsh edge from elevation data (MEED) method uses remotely sensed elevation data to calculate an objective proxy for the shoreline of a salt marsh. This proxy is the abrupt change in elevation that usually characterizes the seaward edge of a salt marsh, designated the “marsh scarp.” It is detected as the maximum slope along a cross-shore transect between mean high water and mean tide level. The method was tested using lidar topobathymetric and photogrammetric elevation data from Massachusetts, USA. The other method to calculate the salt marsh shoreline is the marsh edge by image processing (MEIP) method which finds the unvegetated/vegetated line. This method applies image classification techniques to multispectral imagery and elevation datasets for edge detection. The method was tested using aerial imagery and coastal elevation data from the Plum Island Estuary in Massachusetts, USA. Both methods calculate a line that closely follows the edge of vegetation seen in imagery. The two methods were compared to each other using high resolution unmanned aircraft systems (UAS) data, and to a heads-up digitized shoreline. The root-mean-square deviation was 0.6 meters between the two methods, and less than 0.43 meters from the digitized shoreline. The MEIP method was also applied to a lower resolution dataset to investigate the effect of horizontal resolution on the results. Both methods provide an accurate, efficient, and objective way to track salt marsh shorelines with spatially intensive data over large spatial scales, which is necessary to evaluate geomorphic change and wetland vulnerability."],"timdex_record_id":"whoas:1912-24879","title":"Identifying salt marsh shorelines from remotely sensed elevation data and imagery"},"highlight":{"title":["Identifying salt marsh shorelines from remotely sensed elevation <span class=\"highlight\">data</span> and imagery"]}},{"_index":"rdiwhoas-2022-07-13t19-24-52z","_type":"_doc","_id":"whoas:1912-2327","_score":3.6222847,"_source":{"citation":"Geochemistry Geophysics Geosystems 9 (2008): Q07008","content_type":["Article"],"contributors":[{"kind":"author","value":"Lee, Myung W."},{"kind":"author","value":"Waite, William F."}],"dates":[{"kind":"accessioned","value":"2008-08-13T14:50:52Z"},{"kind":"available","value":"2008-08-13T14:50:52Z"},{"kind":"Publication date","value":"2008-07-09"}],"file_formats":["application/pdf"],"format":"electronic resource","identifiers":[{"kind":"uri","value":"https://hdl.handle.net/1912/2327"},{"kind":"doi","value":"10.1029/2008GC002081"}],"languages":["en_US"],"links":[{"kind":"Digital object URL","text":"Digital object URL","url":"https://hdl.handle.net/1912/2327"}],"notes":[{"value":["This paper is not subject to U.S. copyright.  The definitive version was published in Geochemistry Geophysics Geosystems 9 (2008): Q07008, doi:10.1029/2008GC002081."]}],"publication_information":["American Geophysical Union"],"related_items":[{"uri":"https://doi.org/10.1029/2008GC002081"}],"source":"Woods Hole Open Access Server","source_link":"https://darchive.mblwhoilibrary.org/handle/1912/2327","subjects":[{"kind":"Subject scheme not provided","value":["Methane hydrate","Seismic velocity","Hydrate assessment"]}],"summary":["Relating pore-space gas hydrate saturation to sonic velocity data is important for remotely estimating gas hydrate concentration in sediment. In the present study, sonic velocities of gas hydrate–bearing sands are modeled using a three-phase Biot-type theory in which sand, gas hydrate, and pore fluid form three homogeneous, interwoven frameworks. This theory is developed using well log compressional and shear wave velocity data from the Mallik 5L-38 permafrost gas hydrate research well in Canada and applied to well log data from hydrate-bearing sands in the Alaskan permafrost, Gulf of Mexico, and northern Cascadia margin. Velocity-based gas hydrate saturation estimates are in good agreement with Nuclear Magneto Resonance and resistivity log estimates over the complete range of observed gas hydrate saturations."],"timdex_record_id":"whoas:1912-2327","title":"Estimating pore-space gas hydrate saturations from well log acoustic data"},"highlight":{"title":["Estimating pore-space gas hydrate saturations from well log acoustic <span class=\"highlight\">data</span>"]}},{"_index":"rdiwhoas-2022-07-13t19-24-52z","_type":"_doc","_id":"whoas:1912-24304","_score":3.6222847,"_source":{"citation":"Signell, R. P., \u0026 Pothina, D. (2019). Analysis and visualization of coastal ocean model data in the cloud. Journal of Marine Science and Engineering, 7(4), 110","content_type":["Article"],"contributors":[{"kind":"author","value":"Signell, Richard P."},{"kind":"author","value":"Pothina, Dharhas"}],"dates":[{"kind":"accessioned","value":"2019-07-01T19:10:36Z"},{"kind":"available","value":"2019-07-01T19:10:36Z"},{"kind":"Publication date","value":"2019-04-19"}],"format":"electronic resource","funding_information":[{"funder_name":"This research benefited from National Science Foundation grant number 1740648, and EarthSim project was funded by ERDC projects PETTT BY17-094SP and PETTT BY16-091SP. This project also benefited from research credits granted by Amazon."}],"identifiers":[{"kind":"uri","value":"https://hdl.handle.net/1912/24304"},{"kind":"doi","value":"10.3390/jmse7040110"}],"links":[{"kind":"Digital object URL","text":"Digital object URL","url":"https://hdl.handle.net/1912/24304"}],"notes":[{"value":["© The Author(s), 2019. This article is distributed under the terms of the Creative Commons Attribution License. The definitive version was published in Signell, R. P., \u0026 Pothina, D.  Analysis and visualization of coastal ocean model data in the cloud. Journal of Marine Science and Engineering, 7(4), (2019);110, doi:10.3390/jmse7040110."]}],"publication_information":["MDPI"],"related_items":[{"uri":"https://doi.org/10.3390/jmse7040110"}],"rights":[{},{"uri":"http://creativecommons.org/licenses/by/4.0/"}],"source":"Woods Hole Open Access Server","source_link":"https://darchive.mblwhoilibrary.org/handle/1912/24304","subjects":[{"kind":"Subject scheme not provided","value":["ocean modeling","cloud computing","data analysis","geospatial data visualization"]}],"summary":["The traditional flow of coastal ocean model data is from High-Performance Computing (HPC) centers to the local desktop, or to a file server where just the needed data can be extracted via services such as OPeNDAP. Analysis and visualization are then conducted using local hardware and software. This requires moving large amounts of data across the internet as well as acquiring and maintaining local hardware, software, and support personnel. Further, as data sets increase in size, the traditional workflow may not be scalable. Alternatively, recent advances make it possible to move data from HPC to the Cloud and perform interactive, scalable, data-proximate analysis and visualization, with simply a web browser user interface. We use the framework advanced by the NSF-funded Pangeo project, a free, open-source Python system which provides multi-user login via JupyterHub and parallel analysis via Dask, both running in Docker containers orchestrated by Kubernetes. Data are stored in the Zarr format, a Cloud-friendly n-dimensional array format that allows performant extraction of data by anyone without relying on data services like OPeNDAP. Interactive visual exploration of data on complex, large model grids is made possible by new tools in the Python PyViz ecosystem, which can render maps at screen resolution, dynamically updating on pan and zoom operations. Two examples are given: (1) Calculating the maximum water level at each grid cell from a 53-GB, 720-time-step, 9-million-node triangular mesh ADCIRC simulation of Hurricane Ike; (2) Creating a dashboard for visualizing data from a curvilinear orthogonal COAWST/ROMS forecast model."],"timdex_record_id":"whoas:1912-24304","title":"Analysis and visualization of coastal ocean model data in the cloud."},"highlight":{"title":["Analysis and visualization of coastal ocean model <span class=\"highlight\">data</span> in the cloud."]}},{"_index":"rdiwhoas-2022-07-13t19-24-52z","_type":"_doc","_id":"whoas:1912-2252","_score":3.5113416,"_source":{"citation":"Goff, John A., Jenkins, Chris J., Williams, S. Jeffress (2007-03): Seabed mapping and characterization of sediment variability using the usSEABED data base. Preprint. https://darchive.mblwhoilibrary.org/handle/1912/2252","content_type":["Preprint"],"contributors":[{"kind":"author","value":"Goff, John A."},{"kind":"author","value":"Jenkins, Chris J."},{"kind":"author","value":"Williams, S. Jeffress"}],"dates":[{"kind":"accessioned","value":"2008-06-06T19:32:39Z"},{"kind":"available","value":"2008-06-06T19:32:39Z"},{"kind":"Publication date","value":"2007-03"}],"file_formats":["application/pdf"],"format":"electronic resource","funding_information":[{"funder_name":"The authors thank the Office of Naval Research for support under grants\r\nN00014-05-1-0079 (JAG) and N00014-05-1-0080 (CJJ), and the USGS/Coastal and Marine\r\nGeology Program (SJW)."}],"identifiers":[{"kind":"uri","value":"https://hdl.handle.net/1912/2252"}],"languages":["en_US"],"links":[{"kind":"Digital object URL","text":"Digital object URL","url":"https://hdl.handle.net/1912/2252"}],"notes":[{"value":["Author Posting. © The Author(s), 2007.  This is the author's version of the work. It is posted here by permission of Elsevier B.V. for personal use, not for redistribution.  The definitive version was published in Continental Shelf Research 28 (2008): 614-633, doi:10.1016/j.csr.2007.11.011."]}],"related_items":[{"uri":"https://doi.org/10.1016/j.csr.2007.11.011"}],"source":"Woods Hole Open Access Server","source_link":"https://darchive.mblwhoilibrary.org/handle/1912/2252","subjects":[{"kind":"Subject scheme not provided","value":["Grain size","Continental shelf","Database","Semivariogram","Statistical analysis","Kriging"]}],"summary":["We present a methodology for statistical analysis of randomly-located marine\r\nsediment point data, and apply it to the U.S. continental shelf portions of usSEABED mean grain\r\nsize records. The usSEABED database, like many modern, large environmental datasets, is\r\nheterogeneous and interdisciplinary. We statistically test the database as a source of mean grain\r\nsize data, and from it provide a first examination of regional seafloor sediment variability across\r\nthe entire US continental shelf. Data derived from laboratory analyses (“extracted”) and from\r\nword-based descriptions (“parsed”) are treated separately, and they are compared statistically and deterministically. Data records are selected for spatial analysis by their location within sample\r\nregions: polygonal areas defined in ArcGIS chosen by geography, water depth, and data\r\nsufficiency. We derive isotropic, binned semivariograms from the data, and invert these for\r\nestimates of noise variance, field variance, and decorrelation distance. The highly erratic nature\r\nof the semivariograms is a result both of the random locations of the data and of the high level of\r\ndata uncertainty (noise). This decorrelates the data covariance matrix for the inversion, and\r\nlargely prevents robust estimation of the fractal dimension. Our comparison of the extracted and\r\nparsed mean grain size data demonstrates important differences between the two. In particular,\r\nextracted measurements generally produce finer mean grain sizes, lower noise variance, and\r\nlower field variance than parsed values. Such relationships can be used to derive a regionallydependent\r\nconversion factor between the two. Our analysis of sample regions on the U.S.\r\ncontinental shelf revealed considerable geographic variability in the estimated statistical\r\nparameters of field variance and decorrelation distance. Some regional relationships are evident,\r\nand overall there is a tendency for field variance to be higher where the average mean grain size\r\nis finer grained. Surprisingly, parsed and extracted noise magnitudes correlate with each other,\r\nwhich may indicate that some portion of the data variability that we identify as “noise” is caused\r\nby real grain size variability at very short scales. Our analyses demonstrate that by applying a\r\nbias-correction proxy, usSEABED data can be used to generate reliable interpolated maps of\r\nregional mean grain size and sediment character."],"timdex_record_id":"whoas:1912-2252","title":"Seabed mapping and characterization of sediment variability using the usSEABED data base"},"highlight":{"title":["Seabed mapping and characterization of sediment variability using the usSEABED <span class=\"highlight\">data</span> base"]}},{"_index":"rdiwhoas-2022-07-13t19-24-52z","_type":"_doc","_id":"whoas:1912-8605","_score":3.5113416,"_source":{"citation":"PLoS ONE 11 (2016): e0164979","content_type":["Article"],"contributors":[{"kind":"author","value":"Thieler, E. Robert"},{"kind":"author","value":"Zeigler, Sara L."},{"kind":"author","value":"Winslow, Luke A."},{"kind":"author","value":"Hines, Megan K."},{"kind":"author","value":"Read, Jordan S."},{"kind":"author","value":"Walker, Jordan I."}],"dates":[{"kind":"accessioned","value":"2016-12-20T19:33:34Z"},{"kind":"available","value":"2016-12-20T19:33:34Z"},{"kind":"Publication date","value":"2016-11-09"}],"format":"electronic resource","funding_information":[{"funder_name":"This work was supported by the North Atlantic Landscape Conservation Cooperative through the U.S. Department of the Interior Hurricane Sandy recovery program under the Disaster Relief Appropriations Act of 2013, and the U.S. Geological Survey Coastal and Marine Geology Program."}],"identifiers":[{"kind":"uri","value":"https://hdl.handle.net/1912/8605"},{"kind":"doi","value":"10.1371/journal.pone.0164979"}],"languages":["en_US"],"links":[{"kind":"Digital object URL","text":"Digital object URL","url":"https://hdl.handle.net/1912/8605"}],"notes":[{"value":["This is an open access article, free of all copyright. The definitive version was published in PLoS ONE 11 (2016): e0164979, doi: 10.1371/journal.pone.0164979."]}],"publication_information":["Public Library of Science"],"related_items":[{"description":"https://doi.org/10.5066/F70V89X3","relationship":"haspart"},{"uri":"https://doi.org/10.1371/journal.pone.0164979"}],"rights":[{},{"uri":"http://creativecommons.org/publicdomain/zero/1.0/"}],"source":"Woods Hole Open Access Server","source_link":"https://darchive.mblwhoilibrary.org/handle/1912/8605","summary":["Understanding and managing dynamic coastal landscapes for beach-dependent species requires biological and geological data across the range of relevant environments and habitats. It is difficult to acquire such information; data often have limited focus due to resource constraints, are collected by non-specialists, or lack observational uniformity. We developed an open-source smartphone application called iPlover that addresses these difficulties in collecting biogeomorphic information at piping plover (Charadrius melodus) nest sites on coastal beaches. This paper describes iPlover development and evaluates data quality and utility following two years of collection (n = 1799 data points over 1500 km of coast between Maine and North Carolina, USA). We found strong agreement between field user and expert assessments and high model skill when data were used for habitat suitability prediction. Methods used here to develop and deploy a distributed data collection system have broad applicability to interdisciplinary environmental monitoring and modeling."],"timdex_record_id":"whoas:1912-8605","title":"Smartphone-based distributed data collection enables rapid assessment of shorebird habitat suitability"},"highlight":{"title":["Smartphone-based distributed <span class=\"highlight\">data</span> collection enables rapid assessment of shorebird habitat suitability"]}},{"_index":"rdiwhoas-2022-07-13t19-24-52z","_type":"_doc","_id":"whoas:1912-2241","_score":3.4069924,"_source":{"citation":"Computers \u0026 Geosciences 34 (2008): 561-565","content_type":["Article"],"contributors":[{"kind":"author","value":"Poppe, Lawrence J."},{"kind":"author","value":"Eliason, Andrew H."}],"dates":[{"kind":"accessioned","value":"2008-05-28T16:15:21Z"},{"kind":"available","value":"2008-05-28T16:15:21Z"},{"kind":"Publication date","value":"2007-11-07"}],"file_formats":["application/pdf","application/zip"],"format":"electronic resource","identifiers":[{"kind":"uri","value":"https://hdl.handle.net/1912/2241"},{"kind":"doi","value":"10.1016/j.cageo.2007.03.019"}],"languages":["en_US"],"links":[{"kind":"Digital object URL","text":"Digital object URL","url":"https://hdl.handle.net/1912/2241"}],"notes":[{"value":["This paper is not subject to U.S. copyright.  The definitive version was published in Computers \u0026 Geosciences 34 (2008): 561-565, doi:10.1016/j.cageo.2007.03.019."]}],"publication_information":["Elsevier B.V."],"related_items":[{"uri":"https://doi.org/10.1016/j.cageo.2007.03.019"}],"source":"Woods Hole Open Access Server","source_link":"https://darchive.mblwhoilibrary.org/handle/1912/2241","subjects":[{"kind":"Subject scheme not provided","value":["Software","Program","Visual Basic","Data processing","Ternary diagrams","Sediment","Plotting"]}],"summary":["Sedimentologic datasets are typically large and compiled into tables or databases, but pure numerical information can be difficult to understand and interpret. Thus, scientists commonly use graphical representations to reduce complexities, recognize trends and patterns in the data, and develop hypotheses. Of the graphical techniques, one of the most common methods used by sedimentologists is to plot the basic gravel, sand, silt, and clay percentages on equilateral triangular diagrams. This means of presenting data is simple and facilitates rapid classification of sediments and comparison of samples."],"timdex_record_id":"whoas:1912-2241","title":"A Visual Basic program to plot sediment grain-size data on ternary diagrams"},"highlight":{"title":["A Visual Basic program to plot sediment grain-size <span class=\"highlight\">data</span> on ternary diagrams"]}},{"_index":"rdiwhoas-2022-07-13t19-24-52z","_type":"_doc","_id":"whoas:1912-28021","_score":3.4069924,"_source":{"citation":"Uhran, B., Windham-Myers, L., Bliss, N., Nahlik, A. M., Sundquist, E., \u0026 Stagg, C. L. (2021). Improved wetland soil organic carbon stocks of the conterminous U.S. through data harmonization. Frontiers in Soil Science, 1, 706701.","content_type":["Article"],"contributors":[{"kind":"author","value":"Uhran, Bergit"},{"kind":"author","value":"Windham-Myers, Lisamarie"},{"kind":"author","value":"Bliss, Norman B."},{"kind":"author","value":"Nahlik, Amanda M."},{"kind":"author","value":"Sundquist, Eric T."},{"kind":"author","value":"Stagg, Camille L."}],"dates":[{"kind":"accessioned","value":"2022-02-16T20:35:58Z"},{"kind":"available","value":"2022-02-16T20:35:58Z"},{"kind":"Publication date","value":"2021-10-12"}],"format":"electronic resource","funding_information":[{"funder_name":"This project was funded through the U.S. Geological Survey's Land Carbon Program and a grant to ES through the U.S. Geological Survey's Community for Data Integration Program for generating cross-agency assessments."}],"identifiers":[{"kind":"uri","value":"https://hdl.handle.net/1912/28021"},{"kind":"doi","value":"10.3389/fsoil.2021.706701"}],"links":[{"kind":"Digital object URL","text":"Digital object URL","url":"https://hdl.handle.net/1912/28021"}],"notes":[{"value":["© The Author(s), 2021. This article is distributed under the terms of the Creative Commons Attribution License. The definitive version was published in Uhran, B., Windham-Myers, L., Bliss, N., Nahlik, A. M., Sundquist, E., \u0026 Stagg, C. L.  Improved wetland soil organic carbon stocks of the conterminous U.S. through data harmonization. Frontiers in Soil Science, 1, (2021): 706701, https://doi.org/10.3389/fsoil.2021.706701."]}],"publication_information":["Frontiers Media"],"related_items":[{"uri":"https://doi.org/10.3389/fsoil.2021.706701"}],"rights":[{},{"uri":"http://creativecommons.org/licenses/by/4.0/"}],"source":"Woods Hole Open Access Server","source_link":"https://darchive.mblwhoilibrary.org/handle/1912/28021","subjects":[{"kind":"Subject scheme not provided","value":["soil organic carbon","soil carbon density","wetland","organic matter","soil profile","soil carbon stock vulnerability"]}],"summary":["Wetland soil stocks are important global repositories of carbon (C) but are difficult to quantify and model due to varying sampling protocols, and geomorphic/spatio-temporal discontinuity. Merging scales of soil-survey spatial extents with wetland-specific point-based data offers an explicit, empirical and updatable improvement for regional and continental scale soil C stock assessments. Agency-collected and community-contributed soil datasets were compared for representativeness and bias, with the goal of producing a harmonized national map of wetland soil C stocks with error quantification for wetland areas of the conterminous United States (CONUS) identified by the USGS National Landcover Change Dataset. This allowed an empirical predictive model of SOC density to be applied across the entire CONUS using relational %OC distribution alone. A broken-stick quantile-regression model identified %OC with its relatively high analytical confidence as a key predictor of SOC density in soil segments; soils \u003c6% OC (hereafter, mineral wetland soils, 85% of the dataset) had a strong linear relationship of %OC to SOC density (RMSE = 0.0059, ~4% mean RMSE) and soils \u003e6% OC (organic wetland soils, 15% of the dataset) had virtually no predictive relationship of %OC to SOC density (RMSE = 0.0348 g C cm−3, ~56% mean RMSE). Disaggregation by vegetation type or region did not alter the breakpoint significantly (6% OC) and did not improve model accuracies for inland and tidal wetlands. Similarly, SOC stocks in tidal wetlands were related to %OC, but without a mappable product for disaggregation to improve accuracy by soil class, region or depth. Our layered harmonized CONUS wetland soil maps revised wetland SOC stock estimates downward by 24% (9.5 vs. 12.5Pg C) with the overestimation being entirely an issue of inland organic wetland soils (35% lower than SSURGO-derived SOC stocks). Further, SSURGO underestimated soil carbon stocks at depth, as modeled wetland SOC stocks for organic-rich soils showed significant preservation downcore in the NWCA dataset (\u003c3% loss between 0 and 30 cm and 30 and 100 cm depths) in contrast to mineral-rich soils (37% downcore stock loss). Future CONUS wetland soil C assessments will benefit from focused attention on improved organic wetland soil measurements, land history, and spatial representativeness."],"timdex_record_id":"whoas:1912-28021","title":"Improved wetland soil organic carbon stocks of the conterminous U.S. through data harmonization"},"highlight":{"title":["Improved wetland soil organic carbon stocks of the conterminous U.S. through <span class=\"highlight\">data</span> harmonization"]}},{"_index":"rdiwhoas-2022-07-13t19-24-52z","_type":"_doc","_id":"whoas:1912-24316","_score":3.2158566,"_source":{"citation":"Vance, T. C., Wengren, M., Burger, E., Hernandez, D., Kearns, T., Medina-Lopez, E., Merati, N., O'Brien, K., O'Neil, J., Potemrag, J. T., Signell, R. P., \u0026 Wilcox, K. (2019). From the oceans to the cloud: Opportunities and challenges for data, models, computation and workflows. Frontiers in Marine Science, 6, 211.","content_type":["Article"],"contributors":[{"kind":"author","value":"Vance, Tiffany C."},{"kind":"author","value":"Wengren, Micah"},{"kind":"author","value":"Burger, Eugene"},{"kind":"author","value":"Hernandez, Debra"},{"kind":"author","value":"Kearns, Timothy"},{"kind":"author","value":"Medina-Lopez, Encarni"},{"kind":"author","value":"Merati, Nazila"},{"kind":"author","value":"O'Brien, Kevin"},{"kind":"author","value":"O’Neil, Jon"},{"kind":"author","value":"Potemra, James T."},{"kind":"author","value":"Signell, Richard P."},{"kind":"author","value":"Wilcox, Kyle"}],"dates":[{"kind":"accessioned","value":"2019-07-05T18:20:49Z"},{"kind":"available","value":"2019-07-05T18:20:49Z"},{"kind":"Publication date","value":"2019-05-21"}],"format":"electronic resource","funding_information":[{"funder_name":"This is PMEL contribution 4873."}],"identifiers":[{"kind":"uri","value":"https://hdl.handle.net/1912/24316"},{"kind":"doi","value":"10.3389/fmars.2019.00211"}],"links":[{"kind":"Digital object URL","text":"Digital object URL","url":"https://hdl.handle.net/1912/24316"}],"notes":[{"value":["© The Author(s), 2019. This article is distributed under the terms of the Creative Commons Attribution License. The definitive version was published in Vance, T. C., Wengren, M., Burger, E., Hernandez, D., Kearns, T., Medina-Lopez, E., Merati, N., O'Brien, K., O'Neil, J., Potemrag, J. T., Signell, R. P., \u0026 Wilcox, K. From the oceans to the cloud: Opportunities and challenges for data, models, computation and workflows. Frontiers in Marine Science, 6(211), (2019), doi:10.3389/fmars.2019.00211."]}],"publication_information":["Frontiers Media"],"related_items":[{"uri":"https://doi.org/10.3389/fmars.2019.00211"}],"rights":[{},{"uri":"http://creativecommons.org/licenses/by/4.0/"}],"source":"Woods Hole Open Access Server","source_link":"https://darchive.mblwhoilibrary.org/handle/1912/24316","subjects":[{"kind":"Subject scheme not provided","value":["ocean observation","ocean modeling and prediction","cloud","data management","archiving","technology"]}],"summary":["Advances in ocean observations and models mean increasing flows of data. Integrating observations between disciplines over spatial scales from regional to global presents challenges. Running ocean models and managing the results is computationally demanding. The rise of cloud computing presents an opportunity to rethink traditional approaches. This includes developing shared data processing workflows utilizing common, adaptable software to handle data ingest and storage, and an associated framework to manage and execute downstream modeling. Working in the cloud presents challenges: migration of legacy technologies and processes, cloud-to-cloud interoperability, and the translation of legislative and bureaucratic requirements for “on-premises” systems to the cloud. To respond to the scientific and societal needs of a fit-for-purpose ocean observing system, and to maximize the benefits of more integrated observing, research on utilizing cloud infrastructures for sharing data and models is underway. Cloud platforms and the services/APIs they provide offer new ways for scientists to observe and predict the ocean’s state. High-performance mass storage of observational data, coupled with on-demand computing to run model simulations in close proximity to the data, tools to manage workflows, and a framework to share and collaborate, enables a more flexible and adaptable observation and prediction computing architecture. Model outputs are stored in the cloud and researchers either download subsets for their interest/area or feed them into their own simulations without leaving the cloud. Expanded storage and computing capabilities make it easier to create, analyze, and distribute products derived from long-term datasets. In this paper, we provide an introduction to cloud computing, describe current uses of the cloud for management and analysis of observational data and model results, and describe workflows for running models and streaming observational data. We discuss topics that must be considered when moving to the cloud: costs, security, and organizational limitations on cloud use. Future uses of the cloud via computational sandboxes and the practicalities and considerations of using the cloud to archive data are explored. We also consider the ways in which the human elements of ocean observations are changing – the rise of a generation of researchers whose observations are likely to be made remotely rather than hands on – and how their expectations and needs drive research towards the cloud. In conclusion, visions of a future where cloud computing is ubiquitous are discussed."],"timdex_record_id":"whoas:1912-24316","title":"From the oceans to the cloud: Opportunities and challenges for data, models, computation and workflows."},"highlight":{"title":["From the oceans to the cloud: Opportunities and challenges for <span class=\"highlight\">data</span>, models, computation and workflows"]}},{"_index":"rdizenodo-2022-07-13t19-23-57z","_type":"_doc","_id":"zenodo:4088660","_score":3.0518131,"_source":{"citation":"Hazboun, Jeffrey S (2020): Pulsar Data Toolbox. Zenodo. Software. https://zenodo.org/record/4088660","content_type":["Software"],"contributors":[{"affiliation":["University of Washington Bothell"],"kind":"Creator","identifier":["https://orcid.org/0000-0003-2742-3321"],"value":"Hazboun, Jeffrey S"}],"dates":[{"kind":"Publication date","value":"2020"},{"kind":"Issued","value":"2020-10-14"}],"edition":"0.2.2","format":"electronic resource","identifiers":[{"kind":"DOI","value":"10.5281/zenodo.4088660"},{"kind":"url","value":"https://zenodo.org/record/4088660"}],"publication_information":["Zenodo"],"related_items":[{"relationship":"IsVersionOf","uri":"https://doi.org/10.5281/zenodo.4088659"},{"relationship":"IsPartOf","uri":"https://zenodo.org/communities/astronomy-general"}],"rights":[{"uri":"https://creativecommons.org/licenses/by/4.0/legalcode"},{"uri":"info:eu-repo/semantics/openAccess"}],"source":"Zenodo","source_link":"https://zenodo.org/record/4088660","subjects":[{"kind":"Subject scheme not provided","value":["Pulsars, PTA, data, PSRFITS"]}],"summary":["\u003cp\u003eA software suite used for building PSRFITS data standard files in Python.\u0026nbsp;\u003c/p\u003e"],"timdex_record_id":"zenodo:4088660","title":"Pulsar Data Toolbox"},"highlight":{"title":["Pulsar <span class=\"highlight\">Data</span> Toolbox"]}},{"_index":"rdiwhoas-2022-07-13t19-24-52z","_type":"_doc","_id":"whoas:1912-8672","_score":3.0450268,"_source":{"citation":"Seismological Research Letters 88 (2017): 23-31","content_type":["Article"],"contributors":[{"kind":"author","value":"Flores, Claudia H."},{"kind":"author","value":"ten Brink, Uri S."},{"kind":"author","value":"McGuire, Jeffrey J."},{"kind":"author","value":"Collins, John A."}],"dates":[{"kind":"accessioned","value":"2017-01-30T19:24:18Z"},{"kind":"available","value":"2017-11-02T08:38:36Z"},{"kind":"Publication date","value":"2016-11-02"}],"format":"electronic resource","funding_information":[{"funder_name":"This project was partially\r\nfunded by the Nuclear Regulatory Commission under NRC\r\nJob Number V6166."}],"identifiers":[{"kind":"uri","value":"https://hdl.handle.net/1912/8672"},{"kind":"doi","value":"10.1785/0220160079"}],"languages":["en_US"],"links":[{"kind":"Digital object URL","text":"Digital object URL","url":"https://hdl.handle.net/1912/8672"}],"notes":[{"value":["Author Posting. © Seismological Society of America, 2016.  This article is posted here by permission of Seismological Society of America for personal use, not for redistribution.  The definitive version was published in Seismological Research Letters 88 (2017): 23-31, doi:10.1785/0220160079."]},{"kind":"embargo","value":["2017-11-02"]}],"publication_information":["Seismological Society of America"],"related_items":[{"uri":"https://doi.org/10.1785/0220160079"}],"source":"Woods Hole Open Access Server","source_link":"https://darchive.mblwhoilibrary.org/handle/1912/8672","summary":["Earthquake data from two short‐period ocean‐bottom seismometer (OBS) networks deployed for over a year on the continental slope off New York and southern New England were used to evaluate seismicity and ground motions along the continental margin. Our OBS networks located only one earthquake of Mc∼1.5 near the shelf edge during six months of recording, suggesting that seismic activity (MLg\u003e3.0) of the margin as far as 150–200 km offshore is probably successfully monitored by land stations without the need for OBS deployments. The spectral acceleration from two local earthquakes recorded by the OBS was found to be generally similar to the acceleration from these earthquakes recorded at several seismic stations on land and to hybrid empirical acceleration relationships for eastern North America. Therefore, the seismic attenuation used for eastern North America can be extended in this region at least to the continental slope. However, additional offshore studies are needed to verify these preliminary conclusions."],"timdex_record_id":"whoas:1912-8672","title":"Observations of seismicity and ground motion in the Northeast U.S. Atlantic Margin from ocean‐bottom seismometer data"},"highlight":{"title":["Atlantic Margin from ocean‐bottom seismometer <span class=\"highlight\">data</span>"]}},{"_index":"rdiwhoas-2022-07-13t19-24-52z","_type":"_doc","_id":"whoas:1912-8744","_score":2.8914313,"_source":{"citation":"Geochemistry, Geophysics, Geosystems 17 (2016): 4354–4365","content_type":["Article"],"contributors":[{"kind":"author","value":"Brothers, Laura L."},{"kind":"author","value":"Herman, Bruce M."},{"kind":"author","value":"Hart, Patrick E."},{"kind":"author","value":"Ruppel, Carolyn D."}],"dates":[{"kind":"accessioned","value":"2017-02-27T18:50:20Z"},{"kind":"available","value":"2017-05-04T08:06:02Z"},{"kind":"Publication date","value":"2016-11-04"}],"format":"electronic resource","funding_information":[{"funder_name":"DOE NETL/NRC Methane Hydrate Fellowship Grant Number: DE-FC26-05NT42248;\r\n    USGS–DOE Interagency Agreements Grant Number: DE-FE000291 and 0023495"}],"identifiers":[{"kind":"uri","value":"https://hdl.handle.net/1912/8744"},{"kind":"doi","value":"10.1002/2016GC006584"}],"languages":["en_US"],"links":[{"kind":"Digital object URL","text":"Digital object URL","url":"https://hdl.handle.net/1912/8744"}],"notes":[{"value":["Author Posting. © American Geophysical Union, 2016.  This article is posted here by permission of American Geophysical Union for personal use, not for redistribution.  The definitive version was published in Geochemistry, Geophysics, Geosystems 17 (2016): 4354–4365, doi:10.1002/2016GC006584."]},{"kind":"embargo","value":["2017-05-04"]}],"publication_information":["John Wiley \u0026 Sons"],"related_items":[{"uri":"https://doi.org/10.1002/2016GC006584"}],"source":"Woods Hole Open Access Server","source_link":"https://darchive.mblwhoilibrary.org/handle/1912/8744","subjects":[{"kind":"Subject scheme not provided","value":["Subsea permafrost","Gas hydrates","Multichannel seismic data","Arctic Ocean"]}],"summary":["Subsea ice-bearing permafrost (IBPF) and associated gas hydrate in the Arctic have been subject to a warming climate and saline intrusion since the last transgression at the end of the Pleistocene. The consequent degradation of IBPF is potentially associated with significant degassing of dissociating gas hydrate deposits. Previous studies interpreted the distribution of subsea permafrost on the U.S. Beaufort continental shelf based on geographically sparse data sets and modeling of expected thermal history. The most cited work projects subsea permafrost to the shelf edge (∼100 m isobath). This study uses a compilation of stacking velocity analyses from ∼100,000 line-km of industry-collected multichannel seismic reflection data acquired over 57,000 km2 of the U.S. Beaufort shelf to delineate continuous subsea IBPF. Gridded average velocities of the uppermost 750 ms two-way travel time range from 1475 to 3110 m s−1. The monotonic, cross-shore pattern in velocity distribution suggests that the seaward extent of continuous IBPF is within 37 km of the modern shoreline at water depths \u003c 25 m. These interpretations corroborate recent Beaufort seismic refraction studies and provide the best, margin-scale evidence that continuous subsea IBPF does not currently extend to the northern limits of the continental shelf."],"timdex_record_id":"whoas:1912-8744","title":"Subsea ice-bearing permafrost on the U.S. Beaufort Margin : 1. Minimum seaward extent defined from multichannel seismic reflection data"},"highlight":{"title":["Minimum seaward extent defined from multichannel seismic reflection <span class=\"highlight\">data</span>"]}},{"_index":"rdiwhoas-2022-07-13t19-24-52z","_type":"_doc","_id":"whoas:1912-24300","_score":2.8914313,"_source":{"citation":"Lentz, E. E., Plant, N. G., \u0026 Thieler, E. R. (2019). Relationships between regional coastal land cover distributions and elevation reveal data uncertainty in a sea-level rise impacts model. Earth Surface Dynamics, 7(2), 429-438","content_type":["Article"],"contributors":[{"kind":"author","value":"Lentz, Erika E."},{"kind":"author","value":"Plant, Nathaniel G."},{"kind":"author","value":"Thieler, E. Robert"}],"dates":[{"kind":"accessioned","value":"2019-07-01T15:57:00Z"},{"kind":"available","value":"2019-07-01T15:57:00Z"},{"kind":"Publication date","value":"2019-05-15"}],"format":"electronic resource","funding_information":[{"funder_name":"This research was funded by the U.S. Geological Survey Coastal and Marine Geology Program. We thank P. Soupy Dalyander for early reviews and discussion of this paper. Any use of trade, firm, or product names is for descriptive purposes only and does not imply endorsement by the US Government."}],"identifiers":[{"kind":"uri","value":"https://hdl.handle.net/1912/24300"},{"kind":"doi","value":"10.5194/esurf-7-429-2019"}],"links":[{"kind":"Digital object URL","text":"Digital object URL","url":"https://hdl.handle.net/1912/24300"}],"notes":[{"value":["© The Author(s), 2019. This article is distributed under the terms of the Creative Commons Attribution License. The definitive version was published in Lentz, E. E., Plant, N. G., \u0026 Thieler, E. R. Relationships between regional coastal land cover distributions and elevation reveal data uncertainty in a sea-level rise impacts model. Earth Surface Dynamics, 7(2), (2019):429-438, doi:10.5194/esurf-7-429-2019."]}],"publication_information":["European Geosciences Union"],"related_items":[{"uri":"https://doi.org/10.5194/esurf-7-429-2019"}],"rights":[{},{"uri":"http://creativecommons.org/licenses/by/4.0/"}],"source":"Woods Hole Open Access Server","source_link":"https://darchive.mblwhoilibrary.org/handle/1912/24300","summary":["Understanding land loss or resilience in response to sea-level rise (SLR) requires spatially extensive and continuous datasets to capture landscape variability. We investigate the sensitivity and skill of a model that predicts dynamic response likelihood to SLR across the northeastern US by exploring several data inputs and outcomes. Using elevation and land cover datasets, we determine where data error is likely, quantify its effect on predictions, and evaluate its influence on prediction confidence. Results show data error is concentrated in low-lying areas with little impact on prediction skill, as the inherent correlation between the datasets can be exploited to reduce data uncertainty using Bayesian inference. This suggests the approach may be extended to regions with limited data availability and/or poor quality. Furthermore, we verify that model sensitivity in these first-order landscape change assessments is well-matched to larger coastal process uncertainties, for which process-based models are important complements to further reduce uncertainty."],"timdex_record_id":"whoas:1912-24300","title":"Relationships between regional coastal land cover distributions and elevation reveal data uncertainty in a sea-level rise impacts model"},"highlight":{"title":["Relationships between regional coastal land cover distributions and elevation reveal <span class=\"highlight\">data</span> uncertainty"]}},{"_index":"rdizenodo-2022-07-13t19-23-57z","_type":"_doc","_id":"zenodo:3356710","_score":2.8787055,"_source":{"citation":"Boulangier, Jels, Gobrecht, David (2019): Thermodynamic data for astrochemistry. Zenodo. Dataset. https://zenodo.org/record/3356710","content_type":["Dataset"],"contributors":[{"affiliation":["KU Leuven"],"kind":"Creator","identifier":["https://orcid.org/0000-0003-0620-658X"],"value":"Boulangier, Jels"},{"affiliation":["KU Leuven"],"kind":"Creator","identifier":["https://orcid.org/0000-0002-3443-3416"],"value":"Gobrecht, David"}],"dates":[{"kind":"Publication date","value":"2019"},{"kind":"Issued","value":"2019-03-12"}],"edition":"1.1.0","format":"electronic resource","funding_information":[{"award_number":"646758","award_uri":"info:eu-repo/grantAgreement/EC/H2020/646758/","funder_identifier":"10.13039/100010661","funder_identifier_type":"Crossref Funder ID","funder_name":"European Commission"}],"identifiers":[{"kind":"DOI","value":"10.5281/zenodo.3356710"},{"kind":"url","value":"https://zenodo.org/record/3356710"}],"languages":["en"],"notes":[{"kind":"Other","value":["This data is produced and used by Boulangier et al. 2019b (subm.)"]}],"publication_information":["Zenodo"],"related_items":[{"relationship":"IsVersionOf","uri":"https://doi.org/10.5281/zenodo.2590674"},{"relationship":"IsPartOf","uri":"https://zenodo.org/communities/astronomy-general"}],"rights":[{"uri":"https://creativecommons.org/licenses/by/4.0/legalcode"},{"uri":"info:eu-repo/semantics/openAccess"}],"source":"Zenodo","source_link":"https://zenodo.org/record/3356710","subjects":[{"kind":"Subject scheme not provided","value":["astrochemistry"]},{"kind":"Subject scheme not provided","value":["thermodynamics"]},{"kind":"Subject scheme not provided","value":["astronomy"]}],"summary":["\u003cp\u003eCollection of thermodynamic properties of 78 chemical species. The properties include partition functions, rotational and vibrational temperatures, electronic energy levels, the electronic potential energies at 0K., and several minimum energy geometries. The main purpose of this data is to compute the Gibbs free energies of the species, to be used in chemical reaction rates. Therefore, these are provided in the output directory (up to 3000K). A easily exportable JSON file with all thermodynamic properties is also available in the output directory. The data has partially been collected from several databases and individual papers. Missing data has been computed by ourselves. All input data is homogenised to a single format, which is not the case when collected from different sources. The reference folder contains extensive information on the sources where we got the data from. More detailed explanations can be found in the several README files. All processing has been performed using my repository of python scripts (https://bitbucket.org/JelsB/thermochemistry). We encourage people to extend the scripts with more features and extend the data with more chemical species. This work strives towards consistency, since we (and others) found inconsistencies between the thermodynamic databases \u003cem\u003eNIST/JANAF tables\u003c/em\u003e and NASA\u0026#39;s \u003cem\u003eThird Millennium Ideal Gas and Condensed Phase Thermochemical Database for Combustion with Updates from Active Thermochemical Tables. \u003c/em\u003e\u003c/p\u003e"],"timdex_record_id":"zenodo:3356710","title":"Thermodynamic data for astrochemistry"},"highlight":{"title":["Thermodynamic <span class=\"highlight\">data</span> for astrochemistry"]}},{"_index":"rdizenodo-2022-07-13t19-23-57z","_type":"_doc","_id":"zenodo:2590675","_score":2.8787055,"_source":{"citation":"Boulangier, Jels, Gobrecht, David (2019): Thermodynamic data for astrochemistry. Zenodo. Dataset. https://zenodo.org/record/2590675","content_type":["Dataset"],"contributors":[{"affiliation":["KU Leuven"],"kind":"Creator","identifier":["https://orcid.org/0000-0003-0620-658X"],"value":"Boulangier, Jels"},{"affiliation":["KU Leuven"],"kind":"Creator","identifier":["https://orcid.org/0000-0002-3443-3416"],"value":"Gobrecht, David"}],"dates":[{"kind":"Publication date","value":"2019"},{"kind":"Issued","value":"2019-03-12"}],"edition":"1.0.0","format":"electronic resource","funding_information":[{"award_number":"646758","award_uri":"info:eu-repo/grantAgreement/EC/H2020/646758/","funder_identifier":"10.13039/100010661","funder_identifier_type":"Crossref Funder ID","funder_name":"European Commission"}],"identifiers":[{"kind":"DOI","value":"10.5281/zenodo.2590675"},{"kind":"url","value":"https://zenodo.org/record/2590675"}],"notes":[{"kind":"Other","value":["This data is produced and used by Boulangier et al. 2019b (subm.)"]}],"publication_information":["Zenodo"],"related_items":[{"relationship":"IsVersionOf","uri":"https://doi.org/10.5281/zenodo.2590674"},{"relationship":"IsPartOf","uri":"https://zenodo.org/communities/astronomy-general"}],"rights":[{"uri":"https://creativecommons.org/licenses/by/4.0/legalcode"},{"uri":"info:eu-repo/semantics/openAccess"}],"source":"Zenodo","source_link":"https://zenodo.org/record/2590675","subjects":[{"kind":"Subject scheme not provided","value":["astrochemistry"]},{"kind":"Subject scheme not provided","value":["thermodynamics"]},{"kind":"Subject scheme not provided","value":["astronomy"]}],"summary":["\u003cp\u003eCollection of thermodynamic properties of 78 chemical species. The properties include partition functions, rotational and vibrational temperatures, electronic energy levels, the electronic potential energies at 0K., and several minimum energy geometries. The main purpose of this data is to compute the Gibbs free energies of the species, to be used in chemical reaction rates. Therefore, these are provided in the output directory (up to 3000K). A easily exportable JSON file with all thermodynamic properties is also available in the output directory. The data has partially been collected from several databases and individual papers. Missing data has been computed by ourselves. All input data is homogenised to a single format, which is not the case when collected from different sources. The reference folder contains extensive information on the sources where we got the data from. More detailed explanations can be found in the several README files. All processing has been performed using my repository of python scripts (https://bitbucket.org/JelsB/thermochemistry). We encourage people to extend the scripts with more features and extend the data with more chemical species. This work strives towards consistency, since we (and others) found inconsistencies between the thermodynamic databases \u003cem\u003eNIST/JANAF tables\u003c/em\u003e and NASA\u0026#39;s \u003cem\u003eThird Millennium Ideal Gas and Condensed Phase Thermochemical Database for Combustion with Updates from Active Thermochemical Tables. \u003c/em\u003e\u003c/p\u003e"],"timdex_record_id":"zenodo:2590675","title":"Thermodynamic data for astrochemistry"},"highlight":{"title":["Thermodynamic <span class=\"highlight\">data</span> for astrochemistry"]}},{"_index":"rdiwhoas-2022-07-13t19-24-52z","_type":"_doc","_id":"whoas:1912-10454","_score":2.820301,"_source":{"citation":"Remote Sensing 10 (2018): 792","content_type":["Article"],"contributors":[{"kind":"author","value":"Baughman, Carson A."},{"kind":"author","value":"Jones, Benjamin M."},{"kind":"author","value":"Bodony, Karin L."},{"kind":"author","value":"Mann, Daniel H."},{"kind":"author","value":"Larsen, Chris F."},{"kind":"author","value":"Himelstoss, Emily"},{"kind":"author","value":"Smith, Jeremy"}],"dates":[{"kind":"accessioned","value":"2018-07-05T17:57:43Z"},{"kind":"available","value":"2018-07-05T17:57:43Z"},{"kind":"Publication date","value":"2018-05-19"}],"format":"electronic resource","funding_information":[{"funder_name":"Funding for this research was provided by the U.S. Geological Survey Land Change Science\r\nand Land Remote Sensing programs, the U.S. Fish andWildlife Service and the University of Alaska Fairbanks."}],"identifiers":[{"kind":"uri","value":"https://hdl.handle.net/1912/10454"},{"kind":"doi","value":"10.3390/rs10050792"}],"languages":["en_US"],"links":[{"kind":"Digital object URL","text":"Digital object URL","url":"https://hdl.handle.net/1912/10454"}],"notes":[{"value":["© The Author(s), 2018. This article is distributed under the terms of the Creative Commons Attribution License. The definitive version was published in Remote Sensing 10 (2018): 792, doi:10.3390/rs10050792."]}],"publication_information":["MDPI AG"],"related_items":[{"uri":"https://doi.org/10.3390/rs10050792"}],"rights":[{},{"uri":"http://creativecommons.org/licenses/by/4.0/"}],"source":"Woods Hole Open Access Server","source_link":"https://darchive.mblwhoilibrary.org/handle/1912/10454","subjects":[{"kind":"Subject scheme not provided","value":["Remote sensing","LiDAR","Sand dunes","Permafrost","Migration","Sub-Arctic"]}],"summary":["This study uses an airborne Light Detection and Ranging (LiDAR) survey, historical aerial photography and historical climate data to describe the character and dynamics of the Nogahabara Sand Dunes, a sub-Arctic dune field in interior Alaska’s discontinuous permafrost zone. The Nogahabara Sand Dunes consist of a 43-km2 area of active transverse and barchanoid dunes within a 3200-km2 area of vegetated dune and sand sheet deposits. The average dune height in the active portion of the dune field is 5.8 m, with a maximum dune height of 28 m. Dune spacing is variable with average crest-to-crest distances for select transects ranging from 66–132 m. Between 1952 and 2015, dunes migrated at an average rate of 0.52 m a−1. Dune movement was greatest between 1952 and 1978 (0.68 m a−1) and least between 1978 and 2015 (0.43 m a−1). Dunes migrated predominantly to the southeast; however, along the dune field margin, net migration was towards the edge of the dune field regardless of heading. Better constraining the processes controlling dune field dynamics at the Nogahabara dunes would provide information that can be used to model possible reactivation of more northerly dune fields and sand sheets in response to climate change, shifting fire regimes and permafrost thaw."],"timdex_record_id":"whoas:1912-10454","title":"Remotely sensing the morphometrics and dynamics of a cold region dune field using historical aerial photography and airborne LIDAR data"},"highlight":{"title":["morphometrics and dynamics of a cold region dune field using historical aerial photography and airborne LIDAR <span class=\"highlight\">data</span>"]}},{"_index":"rdizenodo-2022-07-13t19-23-57z","_type":"_doc","_id":"zenodo:5728409","_score":2.724182,"_source":{"citation":"Stevens, Abigail (2021): Data for time series tutorial. Zenodo. Dataset. https://zenodo.org/record/5728409","content_type":["Dataset"],"contributors":[{"affiliation":["Michigan State Univ. and Univ. of Michigan"],"kind":"Creator","identifier":["https://orcid.org/0000-0002-5041-3079"],"value":"Stevens, Abigail"}],"dates":[{"kind":"Publication date","value":"2021"},{"kind":"Issued","value":"2021-11-25"}],"format":"electronic resource","identifiers":[{"kind":"DOI","value":"10.5281/zenodo.5728409"},{"kind":"url","value":"https://zenodo.org/record/5728409"}],"languages":["en"],"notes":[{"kind":"Other","value":["{\"references\": [\"Wilson-Hodge, C. et al. (2018). \\\"NICER and Fermi GBM Observations of the First Galactic Ultraluminous X-Ray Pulsar Swift J0243.6+6124,\\\" ApJ, 863, 9.\", \"Stevens, A.L. et al. (2018). \\\" A NICER Discovery of a Low-frequency Quasi-periodic Oscillation in the Soft-intermediate State of MAXI J1535-571,\\\" ApJ, 865, L15.\"]}"]}],"publication_information":["Zenodo"],"related_items":[{"relationship":"IsVersionOf","uri":"https://doi.org/10.5281/zenodo.5728408"},{"relationship":"IsPartOf","uri":"https://zenodo.org/communities/astronomy-general"}],"rights":[{"uri":"https://creativecommons.org/licenses/by/4.0/legalcode"},{"uri":"info:eu-repo/semantics/openAccess"}],"source":"Zenodo","source_link":"https://zenodo.org/record/5728409","subjects":[{"kind":"Subject scheme not provided","value":["astronomy"]}],"summary":["\u003cp\u003eThese are sample data files to be used in the time series tutorial found here: \u003ca href=\"https://github.com/abigailStev/timeseries-tutorial\"\u003ehttps://github.com/abigailStev/timeseries-tutorial \u003c/a\u003e\u003c/p\u003e\n\n\u003cp\u003eThey are public datasets from the NICER X-ray Timing Instrument of a black hole, MAXI J1535-571, and a neutron star, Swift J0243.6+6124. There are also Good Time Intervals I created for each of the photon event lists.\u003c/p\u003e"],"timdex_record_id":"zenodo:5728409","title":"Data for time series tutorial"},"highlight":{"title":["<span class=\"highlight\">Data</span> for time series tutorial"]}},{"_index":"rdizenodo-2022-07-13t19-23-57z","_type":"_doc","_id":"zenodo:3221478","_score":2.724182,"_source":{"citation":"Foreman-Mackey, Daniel (2017): Fitting a plane to data. Zenodo. Text. https://zenodo.org/record/3221478","content_type":["Text"],"contributors":[{"kind":"Creator","identifier":["https://orcid.org/0000-0002-9328-5652"],"value":"Foreman-Mackey, Daniel"}],"dates":[{"kind":"Publication date","value":"2017"},{"kind":"Issued","value":"2017-06-01"}],"format":"electronic resource","identifiers":[{"kind":"DOI","value":"10.5281/zenodo.3221478"},{"kind":"url","value":"https://zenodo.org/record/3221478"}],"languages":["en"],"notes":[{"kind":"Datacite resource type","value":["Technical note"]}],"publication_information":["Zenodo"],"related_items":[{"relationship":"IsVersionOf","uri":"https://doi.org/10.5281/zenodo.3221477"},{"relationship":"IsPartOf","uri":"https://zenodo.org/communities/astronomy-general"}],"rights":[{"uri":"https://creativecommons.org/licenses/by/4.0/legalcode"},{"uri":"info:eu-repo/semantics/openAccess"}],"source":"Zenodo","source_link":"https://zenodo.org/record/3221478","summary":["\u003cp\u003eMy blog post about how to fit a plane to data:\u0026nbsp;\u003ca href=\"https://dfm.io/posts/fitting-a-plane/\"\u003ehttps://dfm.io/posts/fitting-a-plane/\u003c/a\u003e\u003c/p\u003e"],"timdex_record_id":"zenodo:3221478","title":"Fitting a plane to data"},"highlight":{"title":["Fitting a plane to <span class=\"highlight\">data</span>"]}},{"_index":"rdizenodo-2022-07-13t19-23-57z","_type":"_doc","_id":"zenodo:6611382","_score":2.5854023,"_source":{"citation":"Lokken, Martine, Gagliano, Alexander, Narayan, Gautham, Hložek, Renée, Kessler, Richard, Crenshaw, John Franklin, Salo, Laura, Alves, Catarina S., Chatterjee, Deep, Vincenzi, Maria, Malz, Alex I. (2022): SCOTCH Catalogue and Associated Data Files. Zenodo. Dataset. https://zenodo.org/record/6611382","content_type":["Dataset"],"contributors":[{"affiliation":["University of Toronto"],"kind":"Creator","identifier":["https://orcid.org/0000-0001-5917-955X"],"value":"Lokken, Martine"},{"affiliation":["University of Illinois at Urbana-Champaign"],"kind":"Creator","identifier":["https://orcid.org/0000-0003-4906-8447"],"value":"Gagliano, Alexander"},{"affiliation":["University of Illinois at Urbana-Champaign"],"kind":"Creator","identifier":["https://orcid.org/0000-0001-6022-0484"],"value":"Narayan, Gautham"},{"affiliation":["University of Toronto"],"kind":"Creator","identifier":["https://orcid.org/0000-0002-0965-7864"],"value":"Hložek, Renée"},{"affiliation":["University of Chicago"],"kind":"Creator","identifier":["https://orcid.org/0000-0003-3221-0419"],"value":"Kessler, Richard"},{"affiliation":["University of Washington"],"kind":"Creator","identifier":["https://orcid.org/0000-0002-2495-3514"],"value":"Crenshaw, John Franklin"},{"affiliation":["University of Minnesota"],"kind":"Creator","identifier":["https://orcid.org/0000-0001-5473-6871"],"value":"Salo, Laura"},{"affiliation":["University College London"],"kind":"Creator","identifier":["https://orcid.org/0000-0002-6164-9044"],"value":"Alves, Catarina S."},{"affiliation":["University of Illinois at Urbana-Champaign"],"kind":"Creator","identifier":["https://orcid.org/0000-0003-0038-5468"],"value":"Chatterjee, Deep"},{"affiliation":["Duke University"],"kind":"Creator","identifier":["https://orcid.org/0000-0001-8788-1688"],"value":"Vincenzi, Maria"},{"affiliation":["Ruhr-University Bochum"],"kind":"Creator","identifier":["https://orcid.org/0000-0002-8676-1622"],"value":"Malz, Alex I."}],"dates":[{"kind":"Publication date","value":"2022"},{"kind":"Issued","value":"2022-06-01"}],"edition":"1.0","format":"electronic resource","identifiers":[{"kind":"DOI","value":"10.5281/zenodo.6611382"},{"kind":"url","value":"https://zenodo.org/record/6611382"}],"languages":["en"],"publication_information":["Zenodo"],"related_items":[{"relationship":"IsVersionOf","uri":"https://doi.org/10.5281/zenodo.6601210"},{"relationship":"IsPartOf","uri":"https://zenodo.org/communities/astronomy-general"}],"rights":[{"uri":"https://creativecommons.org/licenses/by/4.0/legalcode"},{"uri":"info:eu-repo/semantics/openAccess"}],"source":"Zenodo","source_link":"https://zenodo.org/record/6611382","subjects":[{"kind":"Subject scheme not provided","value":["large-scale surveys"]},{"kind":"Subject scheme not provided","value":["transient science"]},{"kind":"Subject scheme not provided","value":["simulations"]}],"summary":["\u003cp\u003e\u003cstrong\u003eThe Simulated Catalogue of Optical Transients and Correlated Hosts (SCOTCH)\u003c/strong\u003e\u003c/p\u003e\n\n\u003cp\u003eThis is a \u003cem\u003estatic\u003c/em\u003e data release for SCOTCH, a catalogue containing 5 million explosive transients and the properties of their realistically-associated host galaxies. The catalogue consists of 13 transient classes: 3 SN Ia classes (Ia, Iax, Ia 91bg-like), 2 H-rich core-collapse classes (II, IIn), 5 H-poor classes (Ib, Ic, Ic-BL, IIb, SLSN-I), and 3 non-SN classes (AGN, KN, TDE). Details on the methodology used to construct these data can be found in Lokken, Gagliano, et al. (2022) and the associated repo for this work is located at \u003ca href=\"https://github.com/LSSTDESC/transient-host-sims\"\u003ehttps://github.com/LSSTDESC/transient-host-sims\u003c/a\u003e. This data release consists of three types of files:\u003c/p\u003e\n\n\u003cp\u003e\u003cstrong\u003eSCOTCH Catalogues (scotch_z3.hdf5, scotch_zlim.hdf5): \u003c/strong\u003e\u003c/p\u003e\n\n\u003col\u003e\n\t\u003cli\u003e\u003cstrong\u003escotch_z3.hdf5: \u003c/strong\u003eThis is a catalogue of 5M transients and host properties for 13 transient classes within \u003cspan class=\"math-tex\"\u003e\\(0\u0026lt;z\u0026lt;3\\)\u003c/span\u003e. The relative rates between classes are not realistic. The catalogue consists of two main tables: the \u003cem\u003eTransient Table\u003c/em\u003e and the \u003cem\u003eHost Table. \u003c/em\u003eThe \u003cem\u003eTransient Table \u003c/em\u003econtains true, top-of-the-galaxy light curves in Vera Rubin Observatory LSST passbands (\u003cem\u003eugrizY\u003c/em\u003e) for each of the simulated transients. The \u003cem\u003eHost Table\u003c/em\u003e contains information about the host galaxies of each transient, including apparent magnitude in LSST passbands, shape, star-formation rate, and stellar mass. The two tables are linked and can be cross-matched by \u003cem\u003eTID\u003c/em\u003e, the unique integer ID of a simulated transient; and \u003cem\u003eGID\u003c/em\u003e, the unique integer ID of each host galaxy.\u003c/li\u003e\n\t\u003cli\u003e\u003cstrong\u003escotch_zlim.hdf5 \u003c/strong\u003e(soon to be added!)\u003cstrong\u003e: \u003c/strong\u003eThis catalogue consists of 5M events simulated in SNANA with an upper redshift limit of \u003cspan class=\"math-tex\"\u003e\\(z\u0026lt;0.8\\)\u003c/span\u003e. More events are simulated at lower redshift than SCOTCH_Z3.hdf5, so this catalogue might be more valuable for low-z studies (e.g., of KNe).\u003c/li\u003e\n\u003c/ol\u003e\n\n\u003cp\u003eThe full organization of the catalogue is shown in Figure B1 of our paper, and we provide a list of the schema as Tables 4 and 5. Tutorials for querying the database for specific science cases are available at \u003ca href=\"https://github.com/LSSTDESC/transient-host-sims/blob/main/notebooks/SCOTCH_walkthroughs.ipynb\"\u003ehttps://github.com/LSSTDESC/transient-host-sims/blob/main/notebooks/SCOTCH_walkthroughs.ipynb\u003c/a\u003e.\u003c/p\u003e\n\n\u003cp\u003eIf all you want are the data products, then you\u0026#39;re done! If you\u0026#39;re interested in generating new simulations or are just curious to learn about how we simulated realistic host galaxy correlations, check out the two types of supplemental data files:\u003c/p\u003e\n\n\u003cp\u003e\u003cstrong\u003eHOSTLIBs (*_GHOST.HOSTLIB.gz):\u003c/strong\u003e\u003c/p\u003e\n\n\u003cp\u003eThe libraries of candidate CosmoDC2 host galaxies to which simulated transients are matched. These files can be used to rerun SNANA for unique survey strategies (footprint, cadence, etc), and were generated using \u003ca href=\"https://github.com/LSSTDESC/transient-host-sims/blob/main/notebooks/Hostlib_Constructor.ipynb\"\u003ehttps://github.com/LSSTDESC/transient-host-sims/blob/main/notebooks/Hostlib_Constructor.ipynb\u003c/a\u003e. The transients we\u0026#39;ve simulated use one of five HOSTLIBs: \u003cem\u003eSNIa\u003c/em\u003e, \u003cem\u003eSNIbc\u003c/em\u003e, \u003cem\u003eSNII\u003c/em\u003e, \u003cem\u003eUNMATCHED\u003c/em\u003e, and \u003cem\u003eUNMATCHED_KN\u003c/em\u003e. The first three of these HOSTLIBs encode correlations from the GHOST catalogue (Gagliano+2021). The last two contain representative subsets of CosmoDC2 (no explicit host correlations), and the last file contains galaxies whose photometry has been slightly modified to introduce realistic scatter into the color-color distribution of matched KN host galaxies.\u003c/p\u003e\n\n\u003cp\u003eThe data in these files roughly match the final galaxy properties listed in the SCOTCH catalogue, with one exception: \u003cem\u003eNBR_LIST\u003c/em\u003e, the cosmoDC2 IDs of other galaxies in that HOSTLIB within a 10\u0026#39;\u0026#39; radius of a given galaxy. This is useful for calculating the directional light radius (Gupta+2016) to each transient and realistically mis-associating some hosts (as will be done for ELAsTiCC).\u003c/p\u003e\n\n\u003cp\u003e\u0026nbsp;\u003c/p\u003e\n\n\u003cp\u003e\u003cstrong\u003eWGTMAPs (*_GHOST.WGTMAP.gz): \u003c/strong\u003e\u003c/p\u003e\n\n\u003cp\u003eThe Probability Density Functions (PDFs) describing the probability of a class of transient to occur in a galaxy of certain properties. These can be used as input to rerun SNANA, and were generated using the script \u003ca href=\"https://github.com/LSSTDESC/transient-host-sims/blob/main/scripts/weightmap_generator.py\"\u003ehttps://github.com/LSSTDESC/transient-host-sims/blob/main/scripts/weightmap_generator.py.\u003c/a\u003e The galaxy properties over which a PDF is defined is variable, and the PDF of each class has been constructed to encode subtler correlations than are captured in GHOST and known correlations with derived properties (star-formation rate, metallicity, and stellar mass, none of which are estimated in GHOST). Host matching in SNANA is done from the HOSTLIB conditioned on the WGTMAP distributions. File schema is\u003c/p\u003e\n\n\u003cp\u003e\u003cem\u003ex y z WGT SNMAGSHIFT\u003c/em\u003e\u003c/p\u003e\n\n\u003cp\u003eWhere \u003cem\u003exyz\u003c/em\u003e defines a point along a three-dimensional, uniformly-spaced parameter space of host galaxy properties, \u003cem\u003eWGT\u003c/em\u003e defines the weight to assign a galaxy with those properties\u003cem\u003e \u003c/em\u003ein matching, and \u003cem\u003eSNMAGSHIFT \u003c/em\u003edescribes the magnitude offset to attribute to transients matched to a galaxy with these properties (this SNANA functionality is not used). Interpolation is used to determine the weights for HOSTLIB galaxies with properties between grid points.\u003c/p\u003e\n\n\u003cp\u003e\u0026nbsp;\u003c/p\u003e\n\n\u003cp\u003eQuestions? Comments? Please reach out to Martine Lokken (\u003cem\u003elokken@astro.utoronto.ca\u003c/em\u003e) or Alex Gagliano (\u003cem\u003egaglian2@illinois.edu\u003c/em\u003e).\u003c/p\u003e"],"timdex_record_id":"zenodo:6611382","title":"SCOTCH Catalogue and Associated Data Files"},"highlight":{"title":["SCOTCH Catalogue and Associated <span class=\"highlight\">Data</span> Files"]}},{"_index":"rdizenodo-2022-07-13t19-23-57z","_type":"_doc","_id":"zenodo:6671255","_score":2.5854023,"_source":{"citation":"Lokken, Martine, Gagliano, Alexander, Narayan, Gautham, Hložek, Renée, Kessler, Richard, Crenshaw, John Franklin, Salo, Laura, Alves, Catarina S., Chatterjee, Deep, Vincenzi, Maria, Malz, Alex I. (2022): SCOTCH Catalogue and Associated Data Files. Zenodo. Dataset. https://zenodo.org/record/6671255","content_type":["Dataset"],"contributors":[{"affiliation":["University of Toronto"],"kind":"Creator","identifier":["https://orcid.org/0000-0001-5917-955X"],"value":"Lokken, Martine"},{"affiliation":["University of Illinois at Urbana-Champaign"],"kind":"Creator","identifier":["https://orcid.org/0000-0003-4906-8447"],"value":"Gagliano, Alexander"},{"affiliation":["University of Illinois at Urbana-Champaign"],"kind":"Creator","identifier":["https://orcid.org/0000-0001-6022-0484"],"value":"Narayan, Gautham"},{"affiliation":["University of Toronto"],"kind":"Creator","identifier":["https://orcid.org/0000-0002-0965-7864"],"value":"Hložek, Renée"},{"affiliation":["University of Chicago"],"kind":"Creator","identifier":["https://orcid.org/0000-0003-3221-0419"],"value":"Kessler, Richard"},{"affiliation":["University of Washington"],"kind":"Creator","identifier":["https://orcid.org/0000-0002-2495-3514"],"value":"Crenshaw, John Franklin"},{"affiliation":["University of Minnesota"],"kind":"Creator","identifier":["https://orcid.org/0000-0001-5473-6871"],"value":"Salo, Laura"},{"affiliation":["University College London"],"kind":"Creator","identifier":["https://orcid.org/0000-0002-6164-9044"],"value":"Alves, Catarina S."},{"affiliation":["University of Illinois at Urbana-Champaign"],"kind":"Creator","identifier":["https://orcid.org/0000-0003-0038-5468"],"value":"Chatterjee, Deep"},{"affiliation":["Duke University"],"kind":"Creator","identifier":["https://orcid.org/0000-0001-8788-1688"],"value":"Vincenzi, Maria"},{"affiliation":["Ruhr-University Bochum"],"kind":"Creator","identifier":["https://orcid.org/0000-0002-8676-1622"],"value":"Malz, Alex I."}],"dates":[{"kind":"Publication date","value":"2022"},{"kind":"Issued","value":"2022-06-01"}],"edition":"1.0","format":"electronic resource","identifiers":[{"kind":"DOI","value":"10.5281/zenodo.6671255"},{"kind":"url","value":"https://zenodo.org/record/6671255"}],"languages":["en"],"publication_information":["Zenodo"],"related_items":[{"relationship":"IsVersionOf","uri":"https://doi.org/10.5281/zenodo.6601210"},{"relationship":"IsPartOf","uri":"https://zenodo.org/communities/astronomy-general"}],"rights":[{"uri":"https://creativecommons.org/licenses/by/4.0/legalcode"},{"uri":"info:eu-repo/semantics/openAccess"}],"source":"Zenodo","source_link":"https://zenodo.org/record/6671255","subjects":[{"kind":"Subject scheme not provided","value":["large-scale surveys"]},{"kind":"Subject scheme not provided","value":["transient science"]},{"kind":"Subject scheme not provided","value":["simulations"]}],"summary":["\u003cp\u003e\u003cstrong\u003eThe Simulated Catalogue of Optical Transients and Correlated Hosts (SCOTCH)\u003c/strong\u003e\u003c/p\u003e\n\n\u003cp\u003eThis is a \u003cem\u003estatic\u003c/em\u003e data release for SCOTCH, a catalogue containing 5 million explosive transients and the properties of their realistically-associated host galaxies. The catalogue consists of 13 transient classes: 3 SN Ia classes (Ia, Iax, Ia 91bg-like), 2 H-rich core-collapse classes (II, IIn), 5 H-poor classes (Ib, Ic, Ic-BL, IIb, SLSN-I), and 3 non-SN classes (AGN, KN, TDE). The parameters available for each transient and host galaxy pair are outlined in \u003cstrong\u003eSCOTCH_schema.md\u003c/strong\u003e.\u003c/p\u003e\n\n\u003cp\u003e\u0026nbsp;\u003c/p\u003e\n\n\u003cp\u003eDetails on the methodology used to construct these data can be found in Lokken, Gagliano, et al. (2022) and the associated repo for this work is located at \u003ca href=\"https://github.com/LSSTDESC/transient-host-sims\"\u003ehttps://github.com/LSSTDESC/transient-host-sims\u003c/a\u003e. This data release consists of three types of files:\u003c/p\u003e\n\n\u003cp\u003e\u003cstrong\u003eSCOTCH Catalogues (scotch_z3.hdf5, scotch_zlim.hdf5): \u003c/strong\u003e\u003c/p\u003e\n\n\u003col\u003e\n\t\u003cli\u003e\u003cstrong\u003escotch_z3.hdf5: \u003c/strong\u003eThis is a catalogue of 5M transients and host properties for 13 transient classes within \u003cspan class=\"math-tex\"\u003e\\(0\u0026lt;z\u0026lt;3\\)\u003c/span\u003e. The relative rates between classes are not realistic. The catalogue consists of two main tables: the \u003cem\u003eTransient Table\u003c/em\u003e and the \u003cem\u003eHost Table. \u003c/em\u003eThe \u003cem\u003eTransient Table \u003c/em\u003econtains true, top-of-the-galaxy light curves in Vera Rubin Observatory LSST passbands (\u003cem\u003eugrizY\u003c/em\u003e) for each of the simulated transients. The \u003cem\u003eHost Table\u003c/em\u003e contains information about the host galaxies of each transient, including apparent magnitude in LSST passbands, shape, star-formation rate, and stellar mass. The two tables are linked and can be cross-matched by \u003cem\u003eTID\u003c/em\u003e, the unique integer ID of a simulated transient; and \u003cem\u003eGID\u003c/em\u003e, the unique integer ID of each host galaxy.\u003c/li\u003e\n\t\u003cli\u003e\u003cstrong\u003escotch_zlim.hdf5 \u003c/strong\u003e(soon to be added!)\u003cstrong\u003e: \u003c/strong\u003eThis catalogue consists of 5M events simulated in SNANA with an upper redshift limit of \u003cspan class=\"math-tex\"\u003e\\(z\u0026lt;0.8\\)\u003c/span\u003e. More events are simulated at lower redshift than SCOTCH_Z3.hdf5, so this catalogue might be more valuable for low-z studies (e.g., of KNe).\u003c/li\u003e\n\u003c/ol\u003e\n\n\u003cp\u003eThe full organization of the catalogue is shown in Figure B1 of our paper, and we provide a list of the schema as Tables 4 and 5. Tutorials for querying the database for specific science cases are available at \u003ca href=\"https://github.com/LSSTDESC/transient-host-sims/blob/main/notebooks/SCOTCH_walkthroughs.ipynb\"\u003ehttps://github.com/LSSTDESC/transient-host-sims/blob/main/notebooks/SCOTCH_walkthroughs.ipynb\u003c/a\u003e.\u003c/p\u003e\n\n\u003cp\u003eIf all you want are the data products, then you\u0026#39;re done! If you\u0026#39;re interested in generating new simulations or are just curious to learn about how we simulated realistic host galaxy correlations, check out the two types of supplemental data files:\u003c/p\u003e\n\n\u003cp\u003e\u003cstrong\u003eHOSTLIBs (*_GHOST.HOSTLIB.gz):\u003c/strong\u003e\u003c/p\u003e\n\n\u003cp\u003eThe libraries of candidate CosmoDC2 host galaxies to which simulated transients are matched. These files can be used to rerun SNANA for unique survey strategies (footprint, cadence, etc), and were generated using \u003ca href=\"https://github.com/LSSTDESC/transient-host-sims/blob/main/notebooks/Hostlib_Constructor.ipynb\"\u003ehttps://github.com/LSSTDESC/transient-host-sims/blob/main/notebooks/Hostlib_Constructor.ipynb\u003c/a\u003e. The transients we\u0026#39;ve simulated use one of five HOSTLIBs: \u003cem\u003eSNIa\u003c/em\u003e, \u003cem\u003eSNIbc\u003c/em\u003e, \u003cem\u003eSNII\u003c/em\u003e, \u003cem\u003eUNMATCHED\u003c/em\u003e, and \u003cem\u003eUNMATCHED_KN\u003c/em\u003e. The first three of these HOSTLIBs encode correlations from the GHOST catalogue (Gagliano+2021). The last two contain representative subsets of CosmoDC2 (no explicit host correlations), and the last file contains galaxies whose photometry has been slightly modified to introduce realistic scatter into the color-color distribution of matched KN host galaxies.\u003c/p\u003e\n\n\u003cp\u003eThe data in these files roughly match the final galaxy properties listed in the SCOTCH catalogue, with one exception: \u003cem\u003eNBR_LIST\u003c/em\u003e, the cosmoDC2 IDs of other galaxies in that HOSTLIB within a 10\u0026#39;\u0026#39; radius of a given galaxy. This is useful for calculating the directional light radius (Gupta+2016) to each transient and realistically mis-associating some hosts (as will be done for ELAsTiCC).\u003c/p\u003e\n\n\u003cp\u003e\u0026nbsp;\u003c/p\u003e\n\n\u003cp\u003e\u003cstrong\u003eWGTMAPs (*_GHOST.WGTMAP.gz): \u003c/strong\u003e\u003c/p\u003e\n\n\u003cp\u003eThe Probability Density Functions (PDFs) describing the probability of a class of transient to occur in a galaxy of certain properties. These can be used as input to rerun SNANA, and were generated using the script \u003ca href=\"https://github.com/LSSTDESC/transient-host-sims/blob/main/scripts/weightmap_generator.py\"\u003ehttps://github.com/LSSTDESC/transient-host-sims/blob/main/scripts/weightmap_generator.py.\u003c/a\u003e The galaxy properties over which a PDF is defined is variable, and the PDF of each class has been constructed to encode subtler correlations than are captured in GHOST and known correlations with derived properties (star-formation rate, metallicity, and stellar mass, none of which are estimated in GHOST). Host matching in SNANA is done from the HOSTLIB conditioned on the WGTMAP distributions. File schema is\u003c/p\u003e\n\n\u003cp\u003e\u003cem\u003ex y z WGT SNMAGSHIFT\u003c/em\u003e\u003c/p\u003e\n\n\u003cp\u003eWhere \u003cem\u003exyz\u003c/em\u003e defines a point along a three-dimensional, uniformly-spaced parameter space of host galaxy properties, \u003cem\u003eWGT\u003c/em\u003e defines the weight to assign a galaxy with those properties\u003cem\u003e \u003c/em\u003ein matching, and \u003cem\u003eSNMAGSHIFT \u003c/em\u003edescribes the magnitude offset to attribute to transients matched to a galaxy with these properties (this SNANA functionality is not used). Interpolation is used to determine the weights for HOSTLIB galaxies with properties between grid points.\u003c/p\u003e\n\n\u003cp\u003e\u0026nbsp;\u003c/p\u003e\n\n\u003cp\u003eQuestions? Comments? Please reach out to Martine Lokken (\u003cem\u003elokken@astro.utoronto.ca\u003c/em\u003e) or Alex Gagliano (\u003cem\u003egaglian2@illinois.edu\u003c/em\u003e).\u003c/p\u003e"],"timdex_record_id":"zenodo:6671255","title":"SCOTCH Catalogue and Associated Data Files"},"highlight":{"title":["SCOTCH Catalogue and Associated <span class=\"highlight\">Data</span> Files"]}}]},"aggregations":{"languages":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[{"key":"en","doc_count":18},{"key":"en_us","doc_count":8},{"key":"fr","doc_count":1}]},"content_type":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[{"key":"dataset","doc_count":101},{"key":"article","doc_count":12},{"key":"software","doc_count":5},{"key":"text","doc_count":4},{"key":"preprint","doc_count":2},{"key":"conferencepaper","doc_count":1},{"key":"journalarticle","doc_count":1},{"key":"report","doc_count":1}]},"collections":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[]},"subjects":{"doc_count":311,"subject_names":{"doc_count_error_upper_bound":5,"sum_other_doc_count":253,"buckets":[{"key":"social sciences","doc_count":60},{"key":"astronomy","doc_count":7},{"key":"alma","doc_count":5},{"key":"medicine, health and life sciences","doc_count":5},{"key":"cooling flows","doc_count":4},{"key":"emission line galaxies","doc_count":4},{"key":"hydrodynamic simulations","doc_count":4},{"key":"hydrodynamics","doc_count":4},{"key":"lyman-alpha galaxies","doc_count":4},{"key":"lyman-break galaxies","doc_count":4}]}},"content_format":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[{"key":"electronic resource","doc_count":127}]},"literary_form":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[]},"source":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[{"key":"abdul latif jameel poverty action lab dataverse","doc_count":60},{"key":"zenodo","doc_count":54},{"key":"woods hole open access server","doc_count":13}]},"contributors":{"doc_count":663,"contributor_names":{"doc_count_error_upper_bound":6,"sum_other_doc_count":595,"buckets":[{"key":"duflo, esther","doc_count":15},{"key":"greenstone, michael","doc_count":10},{"key":"ashraf, nava","doc_count":6},{"key":"banerjee, abhijit","doc_count":6},{"key":"danehkar, ashkbiz","doc_count":6},{"key":"larreguy, horacio","doc_count":6},{"key":"osman, adam","doc_count":6},{"key":"marshall, john","doc_count":5},{"key":"abhijit banerjee","doc_count":4},{"key":"atkin, david","doc_count":4}]}}}} + recorded_at: Wed, 13 Jul 2022 19:37:49 GMT +recorded_with: VCR 6.1.0