diff --git a/.env.test b/.env.test index b9d122d3..21a31af0 100644 --- a/.env.test +++ b/.env.test @@ -2,7 +2,8 @@ EMAIL_FROM=fake@example.com EMAIL_URL_HOST=localhost:3000 JWT_SECRET_KEY=3862fc949629030de4259b88f6e8f7c3702b2fabfc68d00d46fb7f9f70110690b526997ef4d77765ffa010d8aba440286af39947d0c85287174d99be2db14987 OPENSEARCH_INDEX=all-current +AWS_ENDPOINT_URL_LAMBDA=http://localhost:9200 AWS_ACCESS_KEY_ID=test-key AWS_SECRET_ACCESS_KEY=test-secret AWS_REGION=us-east-1 -TIMDEX_SEMANTIC_BUILDER_FUNCTION_NAME=timdex-semantic-builder-test +TIMDEX_SEMANTIC_BUILDER_FUNCTION_NAME=timdex-semantic-builder-prod:live diff --git a/README.md b/README.md index d9c9ce89..91df7493 100644 --- a/README.md +++ b/README.md @@ -85,7 +85,8 @@ end - Run your test(s). You may receive VCR errors as the `opensearch init` cassette does not have the HTTP transaction you are requesting. However, the nested cassette for your test will generate if it does not exist yet and on future runs these errors will not recur. - Manually confirm the headers do not have sensitive information. This scrubbing process should work, but it is your responsibility to ensure you are not committing secrets to code repositories. If you aren't sure, ask. -- You have to remove or comment out AWS credentials from `.env` before re-running your test or the tests will fail (i.e. this process can only generate cassettes, it can not re-run them with AWS credentials as we scrub the AWS bits from the cassette so VCR does not match) +- You have to remove or comment out AWS credentials from `.env` before re-running your test or the tests will fail (i.e., this process can only generate cassettes; it cannot re-run them while AWS credentials are set, because we scrub the AWS bits from the cassette and VCR then does not match the requests). +- You have to set `AWS_ENDPOINT_URL_LAMBDA` to `http://localhost:9200` in `.env.test` before re-running tests.
This is necessary because the initial call uses the default value set by the AWS SDK but subsequent calls use the filtered value. > [!Important] > We re-use OpenSearch connections, which is handled by the nesting of cassettes (see above). If you have sporadically failing tests, ensure you are nesting your test specific cassette inside of the `opensearch init` cassette. diff --git a/app/graphql/types/query_type.rb b/app/graphql/types/query_type.rb index 1142744d..91859d9f 100644 --- a/app/graphql/types/query_type.rb +++ b/app/graphql/types/query_type.rb @@ -67,7 +67,7 @@ def record_id(id:, index:) description: 'How to join multiword queries. Defaults to "OR" which means any ' \ 'of the words much match. Options include: "OR", "AND"' argument :query_mode, String, required: false, default_value: 'keyword', - description: 'Search mode, either "keyword" or "semantic"' + description: 'Search mode: "keyword" (lexical search), "semantic" (vector search), or "hybrid" (both)' # applied filters argument :access_to_files_filter, [String], diff --git a/app/models/hybrid_query_builder.rb b/app/models/hybrid_query_builder.rb new file mode 100644 index 00000000..6cf408b9 --- /dev/null +++ b/app/models/hybrid_query_builder.rb @@ -0,0 +1,69 @@ +class HybridQueryBuilder + def build(params, fulltext: false) + query_text = params[:q].to_s.strip + + lexical_query = LexicalQueryBuilder.new.build(params, fulltext: fulltext) + + # If no query text provided, return lexical query so filters/other constraints are still applied + return lexical_query if query_text.blank? 
+ + begin + semantic_query = SemanticQueryBuilder.new.build(params, fulltext: fulltext) + + # Both succeeded - combine them with should clause while preserving filters + combine_queries(semantic_query, lexical_query) + rescue SemanticQueryBuilder::LambdaError => e + # Lambda service failure - report to Sentry and gracefully fall back to lexical search + Sentry.capture_exception(e, level: 'warning') + Rails.logger.warn( + "HybridQueryBuilder semantic query failed: #{e.class}: #{e.message}" + ) + lexical_query + end + end + + private + + # Combines semantic and lexical queries while preserving non-q filters. + # The q multi_match stays in the lexical branch to allow semantic-only matches. + def combine_queries(semantic_query, lexical_query) + # Extract filters (non-q constraints like title/citation/geo) to apply at top level. + # Do NOT extract must (which contains the q multi_match) - it stays in lexical branch + # so semantic matches can be returned without matching the q query. + lexical_bool = lexical_query.is_a?(Hash) && lexical_query[:bool] ? lexical_query[:bool] : {} + top_level_filters = lexical_bool[:filter] || [] + + # Keep the full lexical query structure (with q multi_match in must) but remove filters + # so we don't duplicate them in the final query + lexical_search = if lexical_query.is_a?(Hash) && lexical_query[:bool] + { + bool: { + should: lexical_bool[:should] || [], + must: lexical_bool[:must] || [] + }.reject { |_, v| v.blank? } + } + else + lexical_query + end + + hybrid_bool = { + should: [ + semantic_query, + lexical_search + ] + } + + # Apply only filters (non-q constraints) at top level so they apply to both branches + hybrid_bool[:filter] = top_level_filters if top_level_filters.present? + + # In OpenSearch, when a bool query has no filters, should clauses are required by default. + # When filters are added, should clauses become optional. 
We explicitly require at least + # one should clause to match (semantic or lexical) when filters are present, so we don't + # return filter-only results that matched neither branch. + hybrid_bool[:minimum_should_match] = 1 if top_level_filters.present? + + { + bool: hybrid_bool + } + end +end diff --git a/app/models/opensearch.rb b/app/models/opensearch.rb index 7f649c72..d378b219 100644 --- a/app/models/opensearch.rb +++ b/app/models/opensearch.rb @@ -57,6 +57,8 @@ def query builder = case @query_mode when 'semantic' SemanticQueryBuilder.new + when 'hybrid' + HybridQueryBuilder.new else LexicalQueryBuilder.new end diff --git a/app/models/semantic_query_builder.rb b/app/models/semantic_query_builder.rb index 24731d0c..bf884aad 100644 --- a/app/models/semantic_query_builder.rb +++ b/app/models/semantic_query_builder.rb @@ -1,4 +1,7 @@ class SemanticQueryBuilder + # Dedicated exception for Lambda invocation failures (not parsing/validation errors) + class LambdaError < StandardError; end + def build(params, fulltext: false) query_text = params[:q].to_s.strip @@ -13,16 +16,23 @@ def build(params, fulltext: false) def invoke_semantic_builder(query_text) payload = { query: query_text } + function_name = ENV.fetch('TIMDEX_SEMANTIC_BUILDER_FUNCTION_NAME') - response = Timdex::LambdaClient.invoke( - function_name: ENV.fetch('TIMDEX_SEMANTIC_BUILDER_FUNCTION_NAME'), - invocation_type: 'RequestResponse', - payload: payload.to_json - ) + begin + response = Timdex::LambdaClient.invoke( + function_name: function_name, + invocation_type: 'RequestResponse', + payload: payload.to_json + ) + rescue StandardError => e + # All errors from the Lambda service call are wrapped in LambdaError + # so HybridQueryBuilder can catch it and gracefully fall back to lexical search. 
+ raise LambdaError, "Lambda invocation error: #{e.message}", e.backtrace + end + # Response parsing below is outside the rescue block, so JSON/validation errors + # propagate as-is and fail fast rather than triggering graceful fallback. parse_lambda_payload(response.payload) - rescue StandardError => e - raise "Semantic query builder Lambda error: #{e.message}" end def parse_lambda_payload(payload) @@ -39,12 +49,26 @@ def parse_lambda_payload(payload) def parse_lambda_response(lambda_response) # Lambda returns: { "query": { "bool": { "should": [...] } } } - # We extract and return just the inner query object + # We extract and return just the inner query object with keys normalized to symbols raise "Invalid semantic query builder response: missing 'query' key" unless lambda_response.key?('query') query = lambda_response['query'] raise 'Invalid semantic query builder response: query must be a Hash' unless query.is_a?(Hash) - query + # Normalize string keys to symbols for consistency with LexicalQueryBuilder + normalize_keys(query) + end + + # Recursively converts all string keys to symbols in hashes and nested structures. + def normalize_keys(value) + case value + when Hash + value.transform_keys { |k| k.is_a?(String) ? k.to_sym : k } + .transform_values { |v| normalize_keys(v) } + when Array + value.map { |item| normalize_keys(item) } + else + value + end end end diff --git a/config/initializers/lambda.rb b/config/initializers/lambda.rb index 452c58ef..94020ffb 100644 --- a/config/initializers/lambda.rb +++ b/config/initializers/lambda.rb @@ -1,20 +1,17 @@ require 'aws-sdk-lambda' def configure_lambda_client - if ENV['AWS_SESSION_TOKEN'].present? 
- Aws::Lambda::Client.new( - region: ENV.fetch('AWS_REGION', 'us-east-1'), - access_key_id: ENV.fetch('AWS_ACCESS_KEY_ID'), - secret_access_key: ENV.fetch('AWS_SECRET_ACCESS_KEY'), - session_token: ENV.fetch('AWS_SESSION_TOKEN') - ) - else - Aws::Lambda::Client.new( - region: ENV.fetch('AWS_REGION', 'us-east-1'), - access_key_id: ENV.fetch('AWS_ACCESS_KEY_ID'), - secret_access_key: ENV.fetch('AWS_SECRET_ACCESS_KEY') - ) - end + options = { + region: ENV.fetch('AWS_REGION', 'us-east-1'), + access_key_id: ENV.fetch('AWS_ACCESS_KEY_ID'), + secret_access_key: ENV.fetch('AWS_SECRET_ACCESS_KEY') + } + options[:session_token] = ENV['AWS_SESSION_TOKEN'] if ENV['AWS_SESSION_TOKEN'].present? + + # AWS SDK sets this env in prod. However, we need to conditionally set it for tests so VCR can + # intercept the requests with a fake URL. + options[:endpoint] = ENV['AWS_ENDPOINT_URL_LAMBDA'] if ENV['AWS_ENDPOINT_URL_LAMBDA'].present? + Aws::Lambda::Client.new(options) end Timdex::LambdaClient = configure_lambda_client diff --git a/test/controllers/graphql_controller_test.rb b/test/controllers/graphql_controller_test.rb index 213ae8ab..ece7c64d 100644 --- a/test/controllers/graphql_controller_test.rb +++ b/test/controllers/graphql_controller_test.rb @@ -956,4 +956,110 @@ class GraphqlControllerTest < ActionDispatch::IntegrationTest end end end + + test 'graphql search with queryMode keyword uses lexical builder' do + VCR.use_cassette('opensearch init') do + VCR.use_cassette('graphql search data analytics keyword') do + post '/graphql', params: { query: '{ + search(searchterm: "data analytics", queryMode: "keyword") { + records { + title + score + } + } + }' } + assert_equal(200, response.status) + json = JSON.parse(response.body) + + # Verify results are present with no errors + assert_nil(json['errors']) + assert(json['data']['search']['records'].any?) 
+ end + end + end + + test 'graphql search with queryMode semantic uses semantic builder' do + VCR.use_cassette('opensearch init') do + VCR.use_cassette('graphql search data analytics semantic') do + post '/graphql', params: { query: '{ + search(searchterm: "data analytics", queryMode: "semantic") { + records { + title + } + } + }' } + assert_equal(200, response.status) + json = JSON.parse(response.body) + + # Verify results are present with no errors + assert_nil(json['errors']) + assert(json['data']['search']['records'].any?, 'Expected search results') + end + end + end + + test 'graphql search with queryMode hybrid combines semantic and lexical results' do + VCR.use_cassette('opensearch init') do + VCR.use_cassette('graphql search data analytics hybrid') do + post '/graphql', params: { query: '{ + search(searchterm: "data analytics", queryMode: "hybrid") { + records { + title + score + } + } + }' } + assert_equal(200, response.status) + json = JSON.parse(response.body) + + # Verify results are present with no errors + assert_nil(json['errors']) + assert(json['data']['search']['records'].any?) + end + end + end + + test 'graphql search with filter only (no searchterm) returns filtered results' do + VCR.use_cassette('opensearch init') do + VCR.use_cassette('graphql search title') do + post '/graphql', params: { query: '{ + search(title: "Spice") { + records { + title + } + } + }' } + assert_equal(200, response.status) + json = JSON.parse(response.body) + + # Verify results are present with no errors + assert_nil(json['errors']) + assert(json['data']['search']['records'].any?) + + # Verify results match the filter + assert(json['data']['search']['records'].any? 
{ |r| r['title'].include?('Spice') }) + end + end + end + + test 'graphql search defaults to lexical when queryMode not provided' do + VCR.use_cassette('opensearch init') do + VCR.use_cassette('graphql search data analytics') do + post '/graphql', params: { query: '{ + search(searchterm: "data analytics") { + records { + title + score + } + } + }' } + assert_equal(200, response.status) + json = JSON.parse(response.body) + + # Verify results are present with no errors + assert_nil(json['errors']) + assert(json['data']['search']['records'].any?) + end + end + end end diff --git a/test/models/hybrid_query_builder_test.rb b/test/models/hybrid_query_builder_test.rb new file mode 100644 index 00000000..21a90514 --- /dev/null +++ b/test/models/hybrid_query_builder_test.rb @@ -0,0 +1,310 @@ +require 'test_helper' + +class HybridQueryBuilderTest < ActiveSupport::TestCase + setup do + @builder = HybridQueryBuilder.new + end + + test 'returns lexical query when no searchterm provided' do + params = {} + lexical_result = { + bool: { + should: [], + must: [], + filter: [{ term: { content_type: 'article' } }] + } + } + + lexical_mock = mock + lexical_mock.stubs(:build).returns(lexical_result) + LexicalQueryBuilder.expects(:new).returns(lexical_mock) + + result = @builder.build(params) + + # When q is blank, should return lexical query (preserves filters) + assert_equal lexical_result, result + end + + test 'returns lexical query when searchterm is blank' do + params = { q: '' } + lexical_result = { + bool: { + should: [], + must: [], + filter: [{ term: { content_type: 'article' } }] + } + } + + lexical_mock = mock + lexical_mock.stubs(:build).returns(lexical_result) + LexicalQueryBuilder.expects(:new).returns(lexical_mock) + + result = @builder.build(params) + + assert_equal lexical_result, result + end + + test 'returns lexical query when searchterm is only whitespace' do + params = { q: ' ' } + lexical_result = { + bool: { + should: [], + must: [], + filter: [{ term: { 
content_type: 'article' } }] + } + } + + lexical_mock = mock + lexical_mock.stubs(:build).returns(lexical_result) + LexicalQueryBuilder.expects(:new).returns(lexical_mock) + + result = @builder.build(params) + + assert_equal lexical_result, result + end + + test 'combines lexical and semantic queries when both succeed' do + params = { q: 'test query' } + + lexical_result = { + bool: { + should: [{ prefix: { title: { value: 'test' } } }], + must: [{ match: { text: { query: 'test' } } }], + filter: [{ term: { content_type: 'article' } }] + } + } + + semantic_result = { + bool: { + should: [ + { rank_feature: { field: 'embedding', boost: 5.0 } } + ] + } + } + + lexical_mock = mock + lexical_mock.stubs(:build).returns(lexical_result) + semantic_mock = mock + semantic_mock.stubs(:build).returns(semantic_result) + LexicalQueryBuilder.expects(:new).returns(lexical_mock) + SemanticQueryBuilder.expects(:new).returns(semantic_mock) + + result = @builder.build(params) + + # Verify hybrid structure contains bool, should, and filter + assert_includes result, :bool + assert_includes result[:bool], :should + assert_includes result[:bool], :filter + assert_equal 2, result[:bool][:should].length + + # The q multi_match `must` clause stays inside the lexical branch (not promoted to the top level) + # so semantic-only matches can be returned. Only filters are at top level. + assert_equal [{ term: { content_type: 'article' } }], result[:bool][:filter] + + # Verify lexical branch contains both should and must (with q multi_match) + lexical_branch = result[:bool][:should][1] + assert_includes lexical_branch, :bool + assert lexical_branch[:bool][:should].present?
+ assert_equal [{ match: { text: { query: 'test' } } }], lexical_branch[:bool][:must] + end + + test 'preserves filters in hybrid queries' do + params = { q: 'test', content_type_filter: 'article' } + + lexical_result = { + bool: { + should: [{ prefix: { title: { value: 'test' } } }], + must: [], + filter: [{ term: { content_type: 'article' } }] + } + } + + semantic_result = { + bool: { + should: [{ rank_feature: { field: 'embedding', boost: 5.0 } }] + } + } + + lexical_mock = mock + lexical_mock.stubs(:build).returns(lexical_result) + semantic_mock = mock + semantic_mock.stubs(:build).returns(semantic_result) + LexicalQueryBuilder.expects(:new).returns(lexical_mock) + SemanticQueryBuilder.expects(:new).returns(semantic_mock) + + result = @builder.build(params) + + # Filters from lexical should be applied at top level for both branches + assert_equal [{ term: { content_type: 'article' } }], result[:bool][:filter] + + # Both semantic and lexical should be in should clause + assert_equal 2, result[:bool][:should].length + end + + test 'enforces minimum_should_match when filters are present' do + params = { q: 'test', content_type_filter: 'article' } + + lexical_result = { + bool: { + should: [{ prefix: { title: { value: 'test' } } }], + must: [], + filter: [{ term: { content_type: 'article' } }] + } + } + + semantic_result = { + 'bool' => { + 'should' => [{ 'rank_feature' => { 'field' => 'embedding', 'boost' => 5.0 } }] + } + } + + lexical_mock = mock + lexical_mock.stubs(:build).returns(lexical_result) + semantic_mock = mock + semantic_mock.stubs(:build).returns(semantic_result) + LexicalQueryBuilder.expects(:new).returns(lexical_mock) + SemanticQueryBuilder.expects(:new).returns(semantic_mock) + + result = @builder.build(params) + + # With top-level filters present, require at least one semantic/lexical branch + # to match so the query does not degrade into a filter-only match + assert_equal 1, result[:bool][:minimum_should_match] + end + + test 'omits 
minimum_should_match when no filters' do + params = { q: 'test' } + + lexical_result = { + bool: { + should: [], + must: [], + filter: [] + } + } + + semantic_result = { + bool: { + should: [ + { rank_feature: { field: 'embedding', boost: 5.0 } } + ] + } + } + + lexical_mock = mock + lexical_mock.stubs(:build).returns(lexical_result) + semantic_mock = mock + semantic_mock.stubs(:build).returns(semantic_result) + LexicalQueryBuilder.expects(:new).returns(lexical_mock) + SemanticQueryBuilder.expects(:new).returns(semantic_mock) + + result = @builder.build(params) + + # Without filters, minimum_should_match should not be set + assert_nil result[:bool][:minimum_should_match] + end + + test 'semantic matches still respect non-q filters even without matching q' do + # Verify that non-q filters (title, citation, geo, etc.) are enforced at top level + # so semantic matches must still satisfy them, while the q multi_match stays in lexical. + params = { q: 'climate', title: 'arctic' } + + lexical_result = { + bool: { + should: [{ prefix: { title: { value: 'climate' } } }], + must: [{ multi_match: { query: 'climate', fields: %w[title text] } }], + filter: [{ term: { title: 'arctic' } }] + } + } + + semantic_result = { + bool: { + should: [{ rank_feature: { field: 'embedding', boost: 5.0 } }] + } + } + + lexical_mock = mock + lexical_mock.stubs(:build).returns(lexical_result) + semantic_mock = mock + semantic_mock.stubs(:build).returns(semantic_result) + LexicalQueryBuilder.expects(:new).returns(lexical_mock) + SemanticQueryBuilder.expects(:new).returns(semantic_mock) + + result = @builder.build(params) + + # Non-q filters (e.g., title='arctic') are at top level so both semantic and lexical + # branches must satisfy them. Semantic-only matches matching 'climate' in embeddings + # can still be returned, as long as they have title='arctic'. 
+ assert_equal [{ term: { title: 'arctic' } }], result[:bool][:filter] + assert_equal 2, result[:bool][:should].length + + # The q multi_match stays inside the lexical branch (not at top level), + # allowing semantic-only matches that don't match the q query but do match filters. + lexical_branch = result[:bool][:should][1] + assert_includes lexical_branch[:bool], :must + assert(lexical_branch[:bool][:must].any? { |c| c.key?(:multi_match) }) + + # minimum_should_match enforced since filters present + assert_equal 1, result[:bool][:minimum_should_match] + end + + test 'semantic query has symbol keys from semantic builder' do + params = { q: 'test' } + + lexical_result = { + bool: { + should: [], + must: [], + filter: [] + } + } + + # SemanticQueryBuilder now normalizes keys to symbols before returning + semantic_result = { + bool: { + should: [ + { rank_feature: { field: 'embedding', boost: 5.0 } } + ] + } + } + + lexical_mock = mock + lexical_mock.stubs(:build).returns(lexical_result) + semantic_mock = mock + semantic_mock.stubs(:build).returns(semantic_result) + LexicalQueryBuilder.expects(:new).returns(lexical_mock) + SemanticQueryBuilder.expects(:new).returns(semantic_mock) + + result = @builder.build(params) + + # Verify semantic query in should clause has symbol keys (normalized at source) + semantic_query = result[:bool][:should][0] + semantic_query.each_key { |k| assert k.is_a?(Symbol), "Expected symbol key, got #{k.inspect}" } + semantic_query[:bool].each_key { |k| assert k.is_a?(Symbol), "Expected symbol key, got #{k.inspect}" } + end + + test 'gracefully uses lexical when semantic builder raises LambdaError' do + params = { q: 'test query' } + + lexical_result = { + bool: { + should: [{ prefix: { title: { value: 'test' } } }], + must: [{ match: { text: { query: 'test' } } }], + filter: [] + } + } + + lexical_mock = mock + lexical_mock.stubs(:build).returns(lexical_result) + semantic_mock = mock + # SemanticQueryBuilder now raises 
SemanticQueryBuilder::LambdaError for Lambda failures + semantic_mock.stubs(:build).raises(SemanticQueryBuilder::LambdaError.new('service unavailable')) + LexicalQueryBuilder.expects(:new).returns(lexical_mock) + SemanticQueryBuilder.expects(:new).returns(semantic_mock) + + result = @builder.build(params) + + # When semantic fails with Lambda error, fall back to lexical + assert_equal lexical_result, result + end +end diff --git a/test/models/opensearch_test.rb b/test/models/opensearch_test.rb index f7eddace..45235435 100644 --- a/test/models/opensearch_test.rb +++ b/test/models/opensearch_test.rb @@ -139,4 +139,26 @@ class OpensearchTest < ActiveSupport::TestCase result = os.query assert_equal(mock_response, result) end + + test 'uses HybridQueryBuilder when queryMode is hybrid' do + os = Opensearch.new + os.instance_variable_set(:@params, { q: 'test' }) + os.instance_variable_set(:@fulltext, false) + os.instance_variable_set(:@query_mode, 'hybrid') + + mock_response = { + bool: { + should: [ + { bool: { should: [{ rank_feature: { field: 'test', boost: 1.0 } }] } }, + { bool: { must: [{ match: { text: { query: 'test' } } }] } } + ] + } + } + mock_builder = mock + mock_builder.stubs(:build).returns(mock_response) + HybridQueryBuilder.expects(:new).once.returns(mock_builder) + + result = os.query + assert_equal(mock_response, result) + end end diff --git a/test/models/semantic_query_builder_test.rb b/test/models/semantic_query_builder_test.rb index 6452927a..f11ef85d 100644 --- a/test/models/semantic_query_builder_test.rb +++ b/test/models/semantic_query_builder_test.rb @@ -53,10 +53,10 @@ def setup_mock_lambda(response_data) result = @builder.build(params) expected_query = { - 'bool' => { - 'should' => [ - { 'rank_feature' => { 'field' => 'embedding_full_record.hello', 'boost' => 6.94 } }, - { 'rank_feature' => { 'field' => 'embedding_full_record.world', 'boost' => 3.42 } } + bool: { + should: [ + { rank_feature: { field: 'embedding_full_record.hello', boost: 6.94 
} }, + { rank_feature: { field: 'embedding_full_record.world', boost: 3.42 } } ] } } @@ -70,7 +70,7 @@ def setup_mock_lambda(response_data) params = { q: query_text } - assert_raises(RuntimeError) do + assert_raises(SemanticQueryBuilder::LambdaError) do @builder.build(params) end end diff --git a/test/vcr_cassettes/graphql_search_data_analytics_hybrid.yml b/test/vcr_cassettes/graphql_search_data_analytics_hybrid.yml new file mode 100644 index 00000000..25a7fe38 --- /dev/null +++ b/test/vcr_cassettes/graphql_search_data_analytics_hybrid.yml @@ -0,0 +1,167 @@ +--- +http_interactions: +- request: + method: post + uri: http://localhost:9200/2015-03-31/functions/timdex-semantic-builder-prod:live/invocations + body: + encoding: UTF-8 + string: '{"query":"data analytics"}' + headers: + Accept-Encoding: + - '' + Amz-Sdk-Invocation-Id: + - 22445a90-dcae-4bdd-a031-fdbb81f937c8 + X-Amz-Invocation-Type: + - RequestResponse + Content-Type: + - application/octet-stream + Host: + - localhost:9200 + X-Amz-Date: + - 20260430T224732Z + X-Amz-Content-Sha256: + - "" + Authorization: + - "" + User-Agent: + - aws-sdk-ruby3/3.244.0 ua/2.1 api/lambda#1.177.0 os/macos#25 md/arm64 lang/ruby#3.4.9 + md/3.4.9 m/Z,b,D,n + Content-Length: + - '26' + Accept: + - "*/*" + response: + status: + code: 200 + message: OK + headers: + Date: + - Thu, 30 Apr 2026 22:47:33 GMT + Content-Type: + - application/json + Content-Length: + - '360' + Connection: + - keep-alive + X-Amzn-Requestid: + - 58e5c83f-6e1b-463b-ac42-c3e9f4d423f4 + X-Amzn-Remapped-Content-Length: + - '0' + X-Amz-Executed-Version: + - '2' + X-Amzn-Trace-Id: + - Root=1-69f3dc04-40305ad2014d472b1e14c05d;Parent=773d772808703f5f;Sampled=0;Lineage=1:75f47734:0 + body: + encoding: UTF-8 + string: '{"query": {"bool": {"should": [{"rank_feature": {"field": "embedding_full_record.[CLS]", + "boost": 1.0}}, {"rank_feature": {"field": "embedding_full_record.[SEP]", + "boost": 1.0}}, {"rank_feature": {"field": "embedding_full_record.data", "boost": + 
3.960404872894287}}, {"rank_feature": {"field": "embedding_full_record.analytics", + "boost": 7.998181343078613}}]}}}' + recorded_at: Thu, 30 Apr 2026 22:47:33 GMT +- request: + method: get + uri: http://localhost:9200/ + body: + encoding: US-ASCII + string: '' + headers: + User-Agent: + - 'opensearch-ruby/3.4.0 (RUBY_VERSION: 3.4.9; darwin arm64; Faraday v2.14.0)' + Content-Type: + - application/json + Host: + - localhost:9200 + X-Amz-Date: + - 20260430T224733Z + X-Amz-Content-Sha256: + - "" + Authorization: + - "" + Accept-Encoding: + - gzip;q=1.0,deflate;q=0.6,identity;q=0.3 + Accept: + - "*/*" + response: + status: + code: 200 + message: OK + headers: + Date: + - Thu, 30 Apr 2026 22:47:33 GMT + Content-Type: + - application/json; charset=UTF-8 + Content-Length: + - '530' + Connection: + - keep-alive + Access-Control-Allow-Origin: + - "*" + body: + encoding: ASCII-8BIT + string: | + { + "name" : "ae9b9f33323987525821fa9157e5c549", + "cluster_name" : "300442551476:timdex-prod", + "cluster_uuid" : "TPxigA0nQoaOlMKPYgIulw", + "version" : { + "number" : "7.10.2", + "build_type" : "tar", + "build_hash" : "unknown", + "build_date" : "2025-07-17T22:19:57.927928316Z", + "build_snapshot" : false, + "lucene_version" : "9.12.1", + "minimum_wire_compatibility_version" : "7.10.0", + "minimum_index_compatibility_version" : "7.0.0" + }, + "tagline" : "The OpenSearch Project: https://opensearch.org/" + } + recorded_at: Thu, 30 Apr 2026 22:47:33 GMT +- request: + method: post + uri: http://localhost:9200/all-current/_search + body: + encoding: UTF-8 + string: 
'{"from":"0","size":20,"query":{"bool":{"should":[{"bool":{"should":[{"rank_feature":{"field":"embedding_full_record.[CLS]","boost":1.0}},{"rank_feature":{"field":"embedding_full_record.[SEP]","boost":1.0}},{"rank_feature":{"field":"embedding_full_record.data","boost":3.960404872894287}},{"rank_feature":{"field":"embedding_full_record.analytics","boost":7.998181343078613}}]}},{"bool":{"should":[{"prefix":{"title.exact_value":{"value":"data + analytics","boost":15.0}}},{"term":{"title":{"value":"data analytics","boost":1.0}}},{"nested":{"path":"contributors","query":{"term":{"contributors.value":{"value":"data + analytics","boost":0.1}}}}}],"must":[{"multi_match":{"query":"data analytics","fields":["alternate_titles","call_numbers","citation","contents","contributors.value","dates.value","edition","funding_information.*","identifiers.value","languages","locations.value","notes.value","numbering","publication_information","subjects.value","summary","title"],"minimum_should_match":"0%"}}]}}]}},"aggregations":{"access_to_files":{"nested":{"path":"rights"},"aggs":{"only_file_access":{"filter":{"terms":{"rights.kind":["Access + to files"]}},"aggs":{"access_types":{"terms":{"field":"rights.description.keyword"}}}}}},"contributors":{"nested":{"path":"contributors"},"aggs":{"contributor_names":{"terms":{"field":"contributors.value.keyword"}}}},"content_type":{"terms":{"field":"content_type"}},"content_format":{"terms":{"field":"format"}},"languages":{"terms":{"field":"languages.keyword"}},"literary_form":{"terms":{"field":"literary_form"}},"places":{"nested":{"path":"subjects"},"aggs":{"only_spatial":{"filter":{"terms":{"subjects.kind":["Dublin + Core; 
Spatial"]}},"aggs":{"place_names":{"terms":{"field":"subjects.value.keyword"}}}}}},"source":{"terms":{"field":"source"}},"subjects":{"nested":{"path":"subjects"},"aggs":{"subject_names":{"terms":{"field":"subjects.value.keyword"}}}}},"sort":[{"_score":{"order":"desc"}},{"dates.value.as_date":{"order":"desc","nested":{"path":"dates"}}}]}' + headers: + User-Agent: + - 'opensearch-ruby/3.4.0 (RUBY_VERSION: 3.4.9; darwin arm64; Faraday v2.14.0)' + Content-Type: + - application/json + Host: + - localhost:9200 + X-Amz-Date: + - 20260430T224733Z + X-Amz-Content-Sha256: + - "" + Authorization: + - "" + Accept-Encoding: + - gzip;q=1.0,deflate;q=0.6,identity;q=0.3 + Accept: + - "*/*" + response: + status: + code: 200 + message: OK + headers: + Date: + - Thu, 30 Apr 2026 22:47:37 GMT + Content-Type: + - application/json; charset=UTF-8 + Content-Length: + - '97013' + Connection: + - keep-alive + Access-Control-Allow-Origin: + - "*" + body: + encoding: ASCII-8BIT + string: !binary |- + {"took":3305,"timed_out":false,"_shards":{"total":23,"successful":23,"skipped":0,"failed":0},"hits":{"total":{"value":10000,"relation":"gte"},"max_score":null,"hits":[{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935181015606761","_score":32.33303,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935181015606761","timdex_record_id":"alma:9935181015606761","title":"Data analytics and big data","call_numbers":["QA76.9.B45","005.7"],"citation":"Sedkaoui, Soraya (2018): Data analytics and big data. Hoboken, New Jersey : ISTE Ltd/John Wiley and Sons Inc. Language material. 
https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935181015606761","content_type":["Language material"],"contents":["Cover","Half-Title Page","Dedication","Title Page","Copyright Page","Contents","Acknowledgments","Preface","Introduction","Why this book?","Whom is this book for?","Organization of the book","Glossary","PART 1 Towards an Understanding of Big Data:Are You Ready?","1. From Data to Big Data: You Must Walk Before You Can Run","1.1. Introduction","1.2. No analytics without data","1.2.1. Databases","1.2.2. Raw data","1.2.3. Text","1.2.4. Images, audios and videos","1.2.5. The Internet of Things","1.3. From bytes to yottabytes: the data revolution","1.4. Big data: definition","1.5. The 3Vs model","1.6. Why now and what does it bring?","1.7. Conclusions","2. Big Data: A Revolution that Changes the Game","2.1. Introduction","2.2. Beyond the 3Vs","2.3. From understanding data to knowledge","2.4. Improving decision-making","2.5. Things to take into account","2.5.1. Data complexity","2.5.2. Data quality: look out! Not all data are the right data","2.5.3. What else?…Data security","2.6. Big data and businesses","2.6.1. Opportunities","2.6.2. Challenges","2.7. Conclusions","PART 2 Big Data Analytics: A Compilation of Advanced Analytics Techniques that Covers a Wide Range of Data","3. Building an Understanding of Big Data Analytics","3.1. Introduction","3.2. Before breaking down the process… What is data analytics?","3.3. Before and after big data analytics","3.4. Traditional versus advanced analytics: What is the difference?","3.5. Advanced analytics: new paradigm","3.6. New statistical and computational paradigm within the big data context","3.7. Conclusions","4. Why Data Analytics and When Can We Use It?","4.1. Introduction","4.2. Understanding the changes in context","4.3. When real time makes the difference","4.4. What should data analytics address?","4.5. Analytics culture within companies","4.6. 
Big data analytics application: examples","4.7. Conclusions","5. Data Analytics Process: There's Great Work Behind the Scenes","5.1. Introduction","5.2. More data, more questions for better answers","5.2.1. We can never say it enough: \"there is no good wind for those who don't know where they are going\"","5.2.2. Understanding the basics: identify what we already know and what we have yet to find out","5.2.3. Defining the tasks to be accomplished","5.2.4. Which technology to adopt?","5.2.5. Understanding data analytics is good but knowing how to use it is better! (What skills do you need?)","5.2.6. What does the data project cost and how will it pay off in time?","5.2.7. What will it mean to you once you find out?","5.3. Next steps: do you have an idea about a \"secret sauce\"?","5.3.1. First phase: find the data (data collection)","5.3.2. Second phase: construct the data (data preparation)","5.3.3. Third phase: go to exploration and modeling (data analysis)","5.3.4. Fourth phase: evaluate and interpret the results (evaluation and interpretation)","5.3.5. Fifth phase: transform data into actionable knowledge (deploy the model)","5.4. Disciplines that support the big data analytics process","5.4.1. Statistics","5.4.2. Machine learning","5.4.3. Data mining","5.4.4. Text mining","5.4.5. Database management systems","5.4.6. Data streams management systems","5.5. Wait, it's not so simple: what to avoid when building a","5.5.1. Minimize the model error","5.5.2. Maximize the likelihood of the model","5.5.3. What about surveys?","5.6. Conclusions","PART 3 Data Analytics and Machine Learning: the Relevance of Algorithms","6. Machine Learning: a Method of Data Analysis that Automates Analytical Model Building","6.1. Introduction","6.2. From simple descriptive analysis to predictive and prescriptive analyses: what are the different steps?","6.3. Artificial intelligence: algorithms and techniques","6.4. ML: what is it?","6.5. Why is it important?","6.6. 
How does ML work?","6.6.1. Definition the business need (problem statement) and its formalization","6.6.2. Collection and preparation of the useful data that will be used to meet this need","6.6.3. Test the performance of the obtained model","6.6.4. Optimization and production start","6.7. Data scientist: the new alchemist","6.8. Conclusion","7. Supervised versus Unsupervised Algorithms: a Guided Tour","7.1. Introduction","7.2. Supervised and unsupervised learning","7.2.1. Supervised learning: predict, predict and predict!","7.2.2. Unsupervised learning: go to profiles search!","7.3. Regression versus classification","7.3.1. Regression","7.3.2. Classification","7.4. Clustering gathers data","7.4.1. What good could it serve?","7.4.2. Principle of clustering algorithms","7.4.3. Partitioning your data by using the K-means algorithm","7.5. Conclusion","8. Applications and Examples","8.1. Introduction","8.2. Which algorithm to use?","8.2.1. Supervised or unsupervised algorithm: in which case do we use each one?","8.2.2. What about other ML algorithms?","8.3. The duo big data/ML: examples of use","8.3.1. Netflix: show me what you are looking at and I'll personalize what you like","8.3.2. Amazon: when AI comes into your everyday life","8.3.3. And more: proof that data are a source of creativity","8.4. 
Conclusions","Bibliography","Index","Other titles from iSTE in Computer Engineering","EULA"],"contributors":[{"value":"Sedkaoui, Soraya","kind":"author"}],"dates":[{"kind":"Publication date","value":"2018"}],"edition":"1st ed.","holdings":[{"collection":"Wiley Online Library","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53636613240006761&Force_direct=true"}],"identifiers":[{"value":"9781119528067","kind":"ISBN"},{"value":"1119528062","kind":"ISBN"},{"value":"9781119528050","kind":"ISBN"},{"value":"1119528054","kind":"ISBN"},{"value":"9781119528043","kind":"ISBN"},{"value":"1119528046","kind":"ISBN"},{"value":"(CKB)4100000004385186","kind":"OCLC Number"},{"value":"(Au-PeEL)EBL5401178","kind":"OCLC Number"},{"value":"(CaPaEBR)ebr11564831","kind":"OCLC Number"},{"value":"(PPN)236433105","kind":"OCLC Number"},{"value":"1037945978","kind":"OCLC Number"},{"value":"(MiAaPQ)EBC5401178","kind":"OCLC Number"},{"value":"(Perlego)996164","kind":"OCLC Number"},{"value":"(EXLCZ)994100000004385186","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53636613240006761&Force_direct=true","kind":"Digital object URL","text":"Wiley Online Library"}],"literary_form":"Nonfiction","locations":[{"value":"New Jersey","kind":"Place of Publication"},{"value":"Hoboken, New Jersey","kind":"Place of Publication"}],"notes":[{"value":["Soraya Sedkaoui"],"kind":"Title Statement of Responsibility"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"},{"value":["Description based on print version record"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (225 pages)","publishers":[{"name":"ISTE Ltd/John Wiley and Sons Inc","date":"2018","location":"Hoboken, New Jersey"}],"subjects":[{"value":["Big 
data"],"kind":"Topical Term"},{"value":["Databases"],"kind":"Topical Term"},{"value":["Database management"],"kind":"Topical Term"}],"summary":["The main purpose of this book is to investigate, explore and describe approaches and methods to facilitate data understanding through analytics solutions based on its principles, concepts and applications. But analyzing data is also about involving the use of software. For this, and in order to cover some aspect of data analytics, this book uses software (Excel, SPSS, Python, etc) which can help readers to better understand the analytics process in simple terms and supporting useful methods in its application. "],"timdex_provenance":{"source":"alma","run_date":"2025-04-14","run_id":"alma-daily-ingest-2025-04-14t08-28-27","run_record_offset":5691}},"sort":[32.33303,1514764800000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9936024273806761","_score":32.0439,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936024273806761","timdex_record_id":"alma:9936024273806761","title":"Data Analytics Initiatives  : Managing Analytics for Success","call_numbers":["P53.755","001.42"],"citation":"Data Analytics Initiatives  : Managing Analytics for Success. 2022. Milton : Auerbach Publishers, Incorporated. Language material. 
https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936024273806761","content_type":["Language material"],"contributors":[{"value":"Bothe, Ondřej","kind":"Not specified"},{"value":"Kubera, Ondřej","kind":"Not specified"},{"value":"Bednář, David","kind":"Not specified"},{"value":"Potančok, Martin","kind":"Not specified"},{"value":"Novotný, Ota","kind":"Not specified"}],"dates":[{"kind":"Publication date","value":"2022"}],"holdings":[{"collection":"Taylor & Francis Discovery Collection","format":"electronic resource","location":"https://www.taylorfrancis.com/books/9781003304081"}],"identifiers":[{"value":"9781000629347","kind":"ISBN"},{"value":"1000629341","kind":"ISBN"},{"value":"9781000629293. (electronic bk.)","kind":"ISBN"},{"value":"1000629295. (electronic bk.)","kind":"ISBN"},{"value":"9781003304081. (electronic bk.)","kind":"ISBN"},{"value":"1003304087. (electronic bk.)","kind":"ISBN"},{"value":"10.1201/9781003304081. doi","kind":"Other Identifier"},{"value":"tayfra9781003304081","kind":"OCLC Number"},{"value":"(NhCcYBP)tayfra9781003304081","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://www.taylorfrancis.com/books/9781003304081","kind":"Digital object URL"},{"url":"https://www.taylorfrancis.com/books/9781003304081","kind":"Digital object URL","text":"Taylor & Francis Discovery Collection"}],"literary_form":"Nonfiction","locations":[{"value":"No place, unknown, or undetermined","kind":"Place of Publication"},{"value":"Milton","kind":"Place of Publication"}],"notes":[{"value":["Description based upon print version of record"],"kind":"General Note"}],"physical_description":"1 online resource (164 p.)","publishers":[{"name":"Auerbach Publishers, Incorporated","date":"2022","location":"Milton"}],"subjects":[{"value":["Quantitative research"],"kind":"Topical Term"},{"value":["Research - Data processing"],"kind":"Topical Term"}],"summary":["The categorisation of analytical projects could help to 
simplify complexity reasonably and, at the same time, clarify the critical aspects of analytical initiatives. But how can this complex work be categorized? What makes it so complex? Data Analytics Initiatives: Managing Analytics for Success emphasizes that each analytics project is different. At the same time, analytics projects have many common aspects, and these features make them unique compared to other projects. Describing these commonalities helps to develop a conceptual understanding of analytical work. However, features specific to each initiative affects the entire analytics project lifecycle. Neglecting them by trying to use general approaches without tailoring them to each project can lead to failure. In addition to examining typical characteristics of the analytics project and how to categorise them, the book looks at specific types of projects, provides a high-level assessment of their characteristics from a risk perspective, and comments on the most common problems or challenges. The book also presents examples of questions that could be asked of relevant people to analyse an analytics project. These questions help to position properly the project and to find commonalities and general project challenges."],"timdex_provenance":{"source":"alma","run_date":"2026-02-07","run_id":"alma-daily-ingest-2026-02-07t09-21-29","run_record_offset":23276}},"sort":[32.0439,1640995200000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9936019383706761","_score":31.494576,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936019383706761","timdex_record_id":"alma:9936019383706761","title":"Data Analytics in Finance","call_numbers":["HG104","332.0285"],"citation":"Data Analytics in Finance. 2025. Boca Raton : CRC Press, Taylor & Francis Group. Language material. 
https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936019383706761","content_type":["Language material"],"contributors":[{"value":"Dong, Juijian","kind":"Not specified"}],"dates":[{"kind":"Publication date","value":"2025"}],"edition":"First edition.","holdings":[{"collection":"Taylor & Francis Discovery Collection","format":"electronic resource","location":"https://www.taylorfrancis.com/books/9781003620198"}],"identifiers":[{"value":"1040349749. electronic book","kind":"ISBN"},{"value":"9781040349748. electronic book","kind":"ISBN"},{"value":"9781003620198. electronic book","kind":"ISBN"},{"value":"1003620191. electronic book","kind":"ISBN"},{"value":"9781040349687. electronic book","kind":"ISBN"},{"value":"1040349684. electronic book","kind":"ISBN"},{"value":"10.1201/9781003620198. doi","kind":"Other Identifier"},{"value":"tayfra9781003620198","kind":"OCLC Number"},{"value":"(NhCcYBP)tayfra9781003620198","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://www.taylorfrancis.com/books/9781003620198","kind":"Digital object URL"},{"url":"https://www.taylorfrancis.com/books/9781003620198","kind":"Digital object URL","text":"Taylor & Francis Discovery Collection"}],"literary_form":"Nonfiction","locations":[{"value":"Florida","kind":"Place of Publication"},{"value":"Boca Raton","kind":"Place of Publication"}],"notes":[{"value":["Huijian Dong"],"kind":"Title Statement of Responsibility"},{"value":["\"An Auerbach Book.\""],"kind":"General Note"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"},{"value":["Description based on online resource; title from digital title page (viewed on April 28, 2025)"],"kind":"Source of Description Note"}],"physical_description":"1 online resource","publishers":[{"name":"CRC Press, Taylor & Francis Group","date":"2025","location":"Boca Raton"}],"related_items":[{"description":"Data analytics applications","relationship":"In 
Series"}],"subjects":[{"value":["Finance - Data processing"],"kind":"Topical Term"}],"summary":["Data Analytics in Finance covers the methods and application of data analytics in all major areas of finance, including buy-side investments, sell-side investment banking, corporate finance, consumer finance, financial services, real estate, insurance, and commercial banking. It explains statistical inference of big data, financial modeling, machine learning, database querying, data engineering, data visualization, and risk analysis. Emphasizing financial data analytics practices with a solution- oriented purpose, it is a \"one-stop-shop\" of all the major data analytics aspects for each major finance area.The book paints a comprehensive picture of the data analytics process including: Statistical inference of big data Financial modeling Machine learning and AI Database querying Data engineering Data visualization Risk analysis Each chapter is crafted to provide complete guidance for many subject areas including investments, fraud detection, and consumption finance. Avoiding data analytics methods widely available elsewhere, the book focuses on providing data analytics methods specifically applied to key areas of finance. Written as a roadmap for researchers, practitioners, and students to master data analytics instruments in finance, the book also provides a collection of indispensable resources for the readers' reference. 
Offering the knowledge and tools necessary to thrive in a data-driven financial landscape, this book enables readers to deepen their understanding of investments, develop new approaches to risk management, and apply data analytics to finance."],"timdex_provenance":{"source":"alma","run_date":"2026-02-07","run_id":"alma-daily-ingest-2026-02-07t09-21-29","run_record_offset":24583}},"sort":[31.494576,1735689600000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935705087506761","_score":31.494576,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935705087506761","timdex_record_id":"alma:9935705087506761","title":"Data Analytics in Spectroscopy","call_numbers":["Q342","006.3"],"citation":"Dubrovkin, Joseph (2024): Data Analytics in Spectroscopy. Newcastle upon Tyne, England : Cambridge Scholars Publishing. Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935705087506761","content_type":["Language material"],"contents":["Intro","Table of Contents","Preface","About the Structure of the Book","Abbreviations","PART I","Introduction","Chapter One","Chapter Two","Chapter Three","Chapter Four","Conclusion","PART II","PART III","Chapter Five","PART IV","Afterword","Appendix A","Appendix B","Appendix C","Appendix D","Appendix E","Appendix F","Appendix G","Appendix H","Appendix I","Bibliography","Index"],"contributors":[{"value":"Dubrovkin, Joseph","kind":"author"}],"dates":[{"kind":"Publication date","value":"2024"}],"edition":"First edition.","holdings":[{"collection":"Ebook Central Perpetual, DDA and Subscription Titles","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53692164220006761&Force_direct=true"}],"identifiers":[{"value":"1-5275-8037-7","kind":"ISBN"},{"value":"(MiAaPQ)EBC31136556","kind":"OCLC 
Number"},{"value":"(Au-PeEL)EBL31136556","kind":"OCLC Number"},{"value":"(EXLCZ)9930322696600041","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53692164220006761&Force_direct=true","kind":"Digital object URL","text":"Ebook Central Perpetual, DDA and Subscription Titles"}],"literary_form":"Nonfiction","locations":[{"value":"England","kind":"Place of Publication"},{"value":"Newcastle upon Tyne, England","kind":"Place of Publication"}],"notes":[{"value":["Joseph Dubrovkin"],"kind":"Title Statement of Responsibility"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"},{"value":["Description based on print version record"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (510 pages)","publishers":[{"name":"Cambridge Scholars Publishing","date":"[2024]","location":"Newcastle upon Tyne, England"},{"date":"©2024"}],"subjects":[{"value":["Computational intelligence"],"kind":"Topical Term"},{"value":["Artificial intelligence"],"kind":"Topical Term"},{"value":["Biomedical engineering"],"kind":"Topical Term"}],"summary":["This textbook summarizes various studies and significant materials on data analytics in spectroscopy. Its rigorous mathematical basis, in-depth description, and numerous examples of applications in chemistry and physics make this book valuable for theorists, practitioners, and students specializing in data processing in spectroscopy, chemometrics, and analytical chemistry.The bibliography briefly describes hundreds of data analytics applications for solving spectroscopic tasks in industrial and research laboratories. This book differs from existing brief reviews and articles on this topic in that it forms, for the first time, the big picture of all kinds of data analytics methods in spectroscopy. 
The book also provides quickly reproducible computer calculations to illustrate its significant theoretical statements. As such, it can also serve as a practical guide to lecturers in data analytics in the broad field of spectroscopy, including chemometrics and analytical chemistry."],"timdex_provenance":{"source":"alma","run_date":"2025-09-26","run_id":"alma-daily-ingest-2025-09-26t08-22-09","run_record_offset":2063}},"sort":[31.494576,1704067200000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9936020329006761","_score":31.494576,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936020329006761","timdex_record_id":"alma:9936020329006761","title":"Data Analytics in Spectroscopy","call_numbers":["Q342","006.3"],"citation":"Dubrovkin, Joseph (2024): Data Analytics in Spectroscopy. Newcastle upon Tyne, England : Cambridge Scholars Publishing. Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936020329006761","content_type":["Language material"],"contents":["Intro","Table of Contents","Preface","About the Structure of the Book","Abbreviations","PART I","Introduction","Chapter One","Chapter Two","Chapter Three","Chapter Four","Conclusion","PART II","PART III","Chapter Five","PART IV","Afterword","Appendix A","Appendix B","Appendix C","Appendix D","Appendix E","Appendix F","Appendix G","Appendix H","Appendix I","Bibliography","Index"],"contributors":[{"value":"Dubrovkin, Joseph","kind":"author"}],"dates":[{"kind":"Publication date","value":"2024"}],"edition":"First edition.","holdings":[{"collection":"Taylor & Francis Discovery Collection","format":"electronic resource","location":"https://www.taylorfrancis.com/books/9781042824519"}],"identifiers":[{"value":"1527580377","kind":"ISBN"},{"value":"9781527580374","kind":"ISBN"},{"value":"tayfra9781042824519","kind":"OCLC 
Number"},{"value":"(NhCcYBP)tayfra9781042824519","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://www.taylorfrancis.com/books/9781042824519","kind":"Digital object URL"},{"url":"https://www.taylorfrancis.com/books/9781042824519","kind":"Digital object URL","text":"Taylor & Francis Discovery Collection"}],"literary_form":"Nonfiction","locations":[{"value":"England","kind":"Place of Publication"},{"value":"Newcastle upon Tyne, England","kind":"Place of Publication"}],"notes":[{"value":["Joseph Dubrovkin"],"kind":"Title Statement of Responsibility"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"},{"value":["Description based on print version record"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (510 pages)","publishers":[{"name":"Cambridge Scholars Publishing","date":"[2024]","location":"Newcastle upon Tyne, England"},{"date":"©2024"}],"subjects":[{"value":["Computational intelligence"],"kind":"Topical Term"},{"value":["Artificial intelligence"],"kind":"Topical Term"},{"value":["Biomedical engineering"],"kind":"Topical Term"}],"summary":["This textbook summarizes various studies and significant materials on data analytics in spectroscopy. Its rigorous mathematical basis, in-depth description, and numerous examples of applications in chemistry and physics make this book valuable for theorists, practitioners, and students specializing in data processing in spectroscopy, chemometrics, and analytical chemistry.The bibliography briefly describes hundreds of data analytics applications for solving spectroscopic tasks in industrial and research laboratories. This book differs from existing brief reviews and articles on this topic in that it forms, for the first time, the big picture of all kinds of data analytics methods in spectroscopy. The book also provides quickly reproducible computer calculations to illustrate its significant theoretical statements. 
As such, it can also serve as a practical guide to lecturers in data analytics in the broad field of spectroscopy, including chemometrics and analytical chemistry."],"timdex_provenance":{"source":"alma","run_date":"2026-02-07","run_id":"alma-daily-ingest-2026-02-07t09-21-29","run_record_offset":56300}},"sort":[31.494576,1704067200000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935427370706761","_score":31.494576,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935427370706761","timdex_record_id":"alma:9935427370706761","title":"Data analytics for cybersecurity","call_numbers":["QA76.9.A25","005.8"],"citation":"Janeja, Vandana P (2022): Data analytics for cybersecurity. Cambridge ; New York, NY : Cambridge University Press. Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935427370706761","content_type":["Language material"],"contents":["Introduction - data analytics for cybersecurity","Understanding sources of cybersecurity data","Introduction to data mining : clustering, classification and association rule mining","Big data analytics and its need for cybersecurity","Types of cyber attacks","Anomaly detection for cyber security","Anomaly detection","Cybersecurity through time series and spatial data","Cybersecurity through network and graph data","Human centered data analytics for cyber security","Future directions in data analytics for cybersecurity"],"contributors":[{"value":"Janeja, Vandana P","kind":"author"}],"dates":[{"kind":"Publication date","value":"2022"}],"edition":"First edition.","holdings":[{"collection":"Cambridge eBooks and Partner Presses: Full EBA, All eBooks","format":"electronic 
resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53658698790006761&Force_direct=true"}],"identifiers":[{"value":"1-108-24632-X","kind":"ISBN"},{"value":"1-108-23195-0","kind":"ISBN"},{"value":"26930118ECA3DD8EDED4DACA97997439","kind":"OCLC Number"},{"value":"(CKB)24353022000041","kind":"OCLC Number"},{"value":"(UkCbUP)CR9781108231954","kind":"OCLC Number"},{"value":"(MiAaPQ)EBC7109862","kind":"OCLC Number"},{"value":"(Au-PeEL)EBL7109862","kind":"OCLC Number"},{"value":"1286068774","kind":"OCLC Number"},{"value":"(EXLCZ)9924353022000041","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53658698790006761&Force_direct=true","kind":"Digital object URL","text":"Cambridge eBooks and Partner Presses: Full EBA, All eBooks"}],"literary_form":"Nonfiction","locations":[{"value":"England","kind":"Place of Publication"},{"value":"Cambridge ; New York, NY","kind":"Place of Publication"}],"notes":[{"value":["Vandana P. Janeja"],"kind":"Title Statement of Responsibility"},{"value":["Title from publisher's bibliographic system (viewed on 10 Aug 2022)"],"kind":"General Note"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"}],"physical_description":"1 online resource (xiii, 192 pages) : digital, PDF file(s).","publishers":[{"name":"Cambridge University Press","date":"2022","location":"Cambridge ; New York, NY"}],"subjects":[{"value":["Computer security - Data processing"],"kind":"Topical Term"},{"value":["Data mining"],"kind":"Topical Term"}],"summary":["As the world becomes increasingly connected, it is also more exposed to a myriad of cyber threats. We need to use multiple types of tools and techniques to learn and understand the evolving threat landscape. Data is a common thread linking various types of devices and end users. 
Analyzing data across different segments of cybersecurity domains, particularly data generated during cyber-attacks, can help us understand threats better, prevent future cyber-attacks, and provide insights into the evolving cyber threat landscape. This book takes a data oriented approach to studying cyber threats, showing in depth how traditional methods such as anomaly detection can be extended using data analytics and also applies data analytics to non-traditional views of cybersecurity, such as multi domain analysis, time series and spatial data analysis, and human-centered cybersecurity."],"timdex_provenance":{"source":"alma","run_date":"2026-02-12","run_id":"alma-daily-ingest-2026-02-12t09-17-27","run_record_offset":9049}},"sort":[31.494576,1640995200000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9936021890206761","_score":31.494576,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936021890206761","timdex_record_id":"alma:9936021890206761","title":"Data analytics and AI","call_numbers":["QA276.4","001.4/22028563"],"citation":"Data analytics and AI. 2021. Boca Raton, FL : CRC Press, Taylor & Francis Group. Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936021890206761","content_type":["Language material"],"contributors":[{"value":"Liebowitz, Jay","kind":"editor"}],"dates":[{"kind":"Publication date","value":"2021"}],"edition":"First edition.","holdings":[{"collection":"Taylor & Francis Discovery Collection","format":"electronic resource","location":"https://www.taylorfrancis.com/books/9781003019855"}],"identifiers":[{"value":"2020012383","kind":"LCCN"},{"value":"9781000094657. electronic book","kind":"ISBN"},{"value":"1000094650. electronic book","kind":"ISBN"},{"value":"9781003019855. electronic book","kind":"ISBN"},{"value":"1003019854. 
electronic book","kind":"ISBN"},{"value":"paperback","kind":"ISBN"},{"value":"hardcover","kind":"ISBN"},{"value":"tayfra9781003019855","kind":"OCLC Number"},{"value":"(NhCcYBP)tayfra9781003019855","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://www.taylorfrancis.com/books/9781003019855","kind":"Digital object URL"},{"url":"https://www.taylorfrancis.com/books/9781003019855","kind":"Digital object URL","text":"Taylor & Francis Discovery Collection"}],"literary_form":"Nonfiction","locations":[{"value":"Florida","kind":"Place of Publication"},{"value":"Boca Raton, FL","kind":"Place of Publication"}],"notes":[{"value":["edited by Jay Liebowitz, Distinguished Chair of Applied Business and Finance, Harrisburg University of Science and Technology"],"kind":"Title Statement of Responsibility"},{"value":["\"An Auerbach Book\" -- taken from title page"],"kind":"General Note"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"},{"value":["Description based on online resource; title from digital title page (viewed on September 29, 2020)"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (xxiii, 242 pages) : illustrations (chiefly color).","publishers":[{"name":"CRC Press, Taylor & Francis Group","date":"2021","location":"Boca Raton, FL"},{"date":"©2021"}],"related_items":[{"description":"Data analytics applications","relationship":"In Series"}],"subjects":[{"value":["Statistics - Data processing"],"kind":"Topical Term"},{"value":["Artificial intelligence"],"kind":"Topical Term"},{"value":["Artificial Intelligence"],"kind":"Topical Term"}],"summary":["\"Two hot topics in recent years are data analytics and AI (artificial intelligence). These areas will continue to grow in importance for the foreseeable future. Unfortunately, both communities have not been communicating and collaborating with each other to build the necessary synergies. 
This book presents theory, applications, and case studies to bridge the gap between these fields\"--"],"timdex_provenance":{"source":"alma","run_date":"2026-02-07","run_id":"alma-daily-ingest-2026-02-07t09-21-29","run_record_offset":40606}},"sort":[31.494576,1609459200000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935044073106761","_score":31.494576,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935044073106761","timdex_record_id":"alma:9935044073106761","title":"Data Analytics in Sports","call_numbers":["GV716"],"citation":"Barlow, Janine (2015): Data Analytics in Sports. O'Reilly Media, Inc. Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935044073106761","content_type":["Language material"],"contributors":[{"value":"Barlow, Janine","kind":"author"}],"dates":[{"kind":"Publication date","value":"2015"}],"edition":"1st edition","holdings":[{"collection":"O'Reilly Online Learning: Academic/Public Library Edition","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53540434170006761&Force_direct=true"}],"identifiers":[{"value":"9781491927496","kind":"ISBN"},{"value":"1491927496","kind":"ISBN"},{"value":"(CKB)4920000000456960","kind":"OCLC Number"},{"value":"(CaSebORM)9781491927496","kind":"OCLC Number"},{"value":"1081175812","kind":"OCLC Number"},{"value":"on1081175812","kind":"OCLC Number"},{"value":"(EXLCZ)994920000000456960","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53540434170006761&Force_direct=true","kind":"Digital object URL","text":"O'Reilly Online Learning: Academic/Public Library Edition"}],"literary_form":"Fiction","locations":[{"value":"No place, unknown, or 
undetermined","kind":"Place of Publication"}],"notes":[{"value":["Barlow, Janine"],"kind":"Title Statement of Responsibility"},{"value":["Online resource; Title from title page (viewed September 15, 2015)"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (30 pages)","publishers":[{"name":"O'Reilly Media, Inc","date":"2015"}],"subjects":[{"value":["Sports - Data processing"],"kind":"Topical Term"},{"value":["Sports - Economic aspects"],"kind":"Topical Term"},{"value":["Big data"],"kind":"Topical Term"},{"value":["Information visualization"],"kind":"Topical Term"}],"summary":["As any child with a baseball card intuitively knows, sports and statistics go hand-in-hand. Yet, the general media disdain the flood of sports statistics available today: sports are pure and analytic tools are not. Well, if the so-called purists find tools like baseball’s sabermetrics upsetting, then they’d better brace themselves for the new wave of data analytics. In this O’Reilly report, Janine Barlow examines how advanced predictive analytics are impacting the world of sports—from the rise of tools such as Major League Baseball’s Statcast, which collects data on the movement of balls and players, to SportVU, which the National Basketball Association uses to collect spatial analysis data. 
You’ll also learn: How \"Dance Card\" makes accurate predictions about NCAA’s \"March Madness\" tournament Why data is crumbling long-standing myths about performance in soccer How the National Football League is using wearable devices to collect vital health data about its players It’s a new world in sports, where data analytics and related information technologies are changing the experience for teams, players, fans, and investors."],"timdex_provenance":{"source":"alma","run_date":"2025-02-28","run_id":"alma-full-ingest-2025-02-28t22-33-35","run_record_offset":75732}},"sort":[31.494576,1420070400000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935763825606761","_score":30.79344,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935763825606761","timdex_record_id":"alma:9935763825606761","title":"Data analytics and digital transformation","call_numbers":["HD30.2","004.0684"],"citation":"Beulen, Erik, Dans, Marla A (2024): Data analytics and digital transformation. London : Routledge, Taylor & Francis Group. Language material. 
https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935763825606761","content_type":["Language material"],"contents":["Cover","Endorsements Page","Half Title","Series Page","Title Page","Copyright Page","Table of Contents","List of Figures","List of Tables","About the Authors","Preface","Part 1 Business Context","1 Digital Transformations Explained","2 Data Analytics Trends Clarified","Part 2 Data Analytics Foundation","3 Data-Driven Decision-Making","4 Monetization of data and data Analytics","5 Data Quality - Data Management in Action","6 Data Governance - Business and IT Collaboration","7 Data Compliance, Privacy, and Ethics","Part 3 Digital Transformation Phase Powered by data Analytics","8 Digital 1.0 - Supplementing the Going Concern with Digital Initiatives","9 Digital 2.0 - Siloed Digital to Integrated Digital","10 Digital 3.0 - Preparing for Digital Transformation 2025","Part 4 Data Sharing-Centric Digital Transformations","11 Data Management and Governance Implications of data Sharing","12 Data Sharing - Competitive and Sustainability, Compliance, Privacy, and Ethical Implications","13 Partnering in Ecosystems - How to Structure Collaboration?","Part 5 Aligning at the Crossroads of data Analytics and Digital Transformations","14 Identifying good Practices and Roadmaps for Aligning Analytics and Digital Organizational Goals","15 2030 Perspective on Leveraging data Analytics in Achieving Digital Transformation Success","References","Index"],"contributors":[{"value":"Beulen, Erik","kind":"author"},{"value":"Dans, Marla A","kind":"author"}],"dates":[{"kind":"Publication date","value":"2024"}],"holdings":[{"collection":"Taylor & Francis eBooks Complete","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53703335250006761&Force_direct=true"}],"identifiers":[{"value":"9781003246770. 
(ebk)","kind":"ISBN"},{"value":"100324677X","kind":"ISBN"},{"value":"9781003807353. (ebook)","kind":"ISBN"},{"value":"1003807356","kind":"ISBN"},{"value":"9781003807315","kind":"ISBN"},{"value":"1003807313","kind":"ISBN"},{"value":"(MiAaPQ)EBC30767526","kind":"OCLC Number"},{"value":"(Au-PeEL)EBL30767526","kind":"OCLC Number"},{"value":"(CKB)28446180600041","kind":"OCLC Number"},{"value":"(EXLCZ)9928446180600041","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53703335250006761&Force_direct=true","kind":"Digital object URL","text":"Taylor & Francis eBooks Complete"}],"literary_form":"Nonfiction","locations":[{"value":"England","kind":"Place of Publication"},{"value":"London","kind":"Place of Publication"}],"notes":[{"value":["Erik Beulen and Marla A. Dans"],"kind":"Title Statement of Responsibility"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"},{"value":["Description based on print version record"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (257 pages) : illustrations","publishers":[{"name":"Routledge, Taylor & Francis Group","date":"2024","location":"London"},{"date":"©2024"}],"related_items":[{"description":"Business and digital transformation","relationship":"In Series"}],"subjects":[{"value":["Information technology - Management"],"kind":"Topical Term"},{"value":["Big data - Management"],"kind":"Topical Term"},{"value":["Management - Statistical methods"],"kind":"Topical Term"},{"value":["Strategic planning"],"kind":"Topical Term"}],"summary":["Understanding the significance of data analytics is paramount for digital transformation but in many organizations they are separate units without fully aligned goals. 
As organizations are applying digital transformations to be adaptive and agile in a competitive environment, data analytics can play a critical role in their success. This book explores the crossroads between them and how to leverage their connection for improved business outcomes. The need to collaborate and share data is becoming an integral part of digital transformation. This not only creates new opportunities but also requires well-considered and continuously assessed decision-making as competitiveness is at stake. This book details approaches, concepts, and frameworks, as well as actionable insights and good practices, including combined data management and agile concepts. Critical issues are discussed such as data quality and data governance, as well as compliance, privacy, and ethics. It also offers insights into how both private and public organizations can innovate and keep up with growing data volumes and increasing technological developments in the short, mid, and long term. This book will be of direct appeal to global researchers and students across a range of business disciplines, including technology and innovation management, organizational studies, and strategic management. It is also relevant for policy makers, regulators, and executives of private and public organizations looking to implement successful transformation policies."],"timdex_provenance":{"source":"alma","run_date":"2025-12-24","run_id":"alma-daily-ingest-2025-12-24t14-20-23","run_record_offset":4462}},"sort":[30.79344,1704067200000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935248399006761","_score":30.79344,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935248399006761","timdex_record_id":"alma:9935248399006761","title":"Data analytics using Python visualizations","call_numbers":["QA76.73.P98","005.133"],"citation":"Data analytics using Python visualizations. 2022. 
[Place of publication not identified] : Packt Publishing. Projected medium. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935248399006761","content_type":["Projected medium"],"contributors":[{"value":"Dasgupta, Manas","kind":"presenter"},{"value":"Packt Publishing","kind":"publisher"}],"dates":[{"kind":"Publication date","value":"2022"}],"edition":"[First edition].","holdings":[{"collection":"O'Reilly Online Learning: Academic/Public Library Edition","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53647178910006761&Force_direct=true"}],"identifiers":[{"value":"9781804614839","kind":"ISBN"},{"value":"1804614831","kind":"ISBN"},{"value":"(CKB)5590000000932030","kind":"OCLC Number"},{"value":"1334599801","kind":"OCLC Number"},{"value":"(OCoLC-P)1334599801","kind":"OCLC Number"},{"value":"(CaSebORM)9781804614839","kind":"OCLC Number"},{"value":"(EXLCZ)995590000000932030","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53647178910006761&Force_direct=true","kind":"Digital object URL","text":"O'Reilly Online Learning: Academic/Public Library Edition"}],"locations":[{"value":"No place, unknown, or undetermined","kind":"Place of Publication"},{"value":"[Place of publication not identified]","kind":"Place of Publication"}],"notes":[{"value":["\"Updated in June 2022.\""],"kind":"General Note"},{"value":["OCLC-licensed vendor bibliographic record"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (1 video file (6 hr., 28 min.)) : sound, color.","publishers":[{"name":"Packt Publishing","date":"[2022]","location":"[Place of publication not identified]"}],"subjects":[{"value":["Computer science"],"kind":"Topical Term"},{"value":["Python (Computer program 
language)"],"kind":"Topical Term"},{"value":["Electronic data processing"],"kind":"Topical Term"}],"summary":["Master data science, ML, and analytics with powerful visualizations using Matplotlib, Seaborn, and Bokeh. About This Video The art of presenting data in the form of powerful, innovative, and intuitive visualizations In-depth coverage of Matplotlib, Seaborn, and Bokeh visualization libraries Use of data analytics techniques/Exploratory Data Analysis (EDA) using several data generations and manipulation methods In Detail If you are working on machine learning projects and want to find patterns and insights from your data on your way to building models, then this course is for you. This course takes a holistic approach to teach visualization techniques. We will be taking real-life business scenarios and raw data to go through detailed Exploratory Data Analysis (EDA) techniques to prepare the raw data to suit the appropriate visualization needs. You will learn about data analytics and exploratory data analysis techniques using multiple different data structures with NumPy and Pandas libraries. You will also learn various chart/graph types, customization/configuration, and vectorization techniques. We will look at advanced visualizations using business applications such as single and multiple bar charts, pie charts, and bubble charts with the vectorization of properties. We will further explore Seaborn Boxplot, Violin plot, Categorical Scatterplot, and how to create heat maps. By the end of the course, you will learn the foundational techniques of data analytics and deeper customizations on visualizations. You will be able to confidently use Python visualization libraries such as Matplotlib, Seaborn, and Bokeh in your future projects.\\ Audience This course is for Python and machine learning developers, data scientists, data analysts, and business analysts. 
This course will also be beneficial to leaders, managers, and anyone whose job involves presenting data in the form of visuals, which include developers, architects, and system analysts. A basic understanding of Python will be helpful, but not mandatory."],"timdex_provenance":{"source":"alma","run_date":"2025-02-28","run_id":"alma-full-ingest-2025-02-28t22-33-35","run_record_offset":196493}},"sort":[30.79344,1640995200000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935444795806761","_score":30.79344,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935444795806761","timdex_record_id":"alma:9935444795806761","title":"Data analytics using Python visualizations","alternate_titles":[{"value":"Title on screen: Complete 2021 Python visualizations bootcamp","kind":"Varying Form of Title"}],"call_numbers":["QA76.73.P98","005.133"],"citation":"Dasgupta, Manas (Solutions architect) (2022): Data analytics using Python visualizations. Birmingham, England : PACKT Publishing. Projected medium. 
https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935444795806761","content_type":["Projected medium"],"contributors":[{"value":"Dasgupta, Manas (Solutions architect)","kind":"author"},{"value":"Dasgupta, Manas (Solutions architect)","kind":"instructor"},{"value":"Packt Publishing","kind":"production company"},{"value":"Packt Publishing","kind":"publisher"}],"dates":[{"kind":"Publication date","value":"2022"}],"edition":"[First edition].","holdings":[{"collection":"Academic Video Online (AVON)","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53660982330006761&Force_direct=true"}],"identifiers":[{"value":"(CKB)5590000001028878","kind":"OCLC Number"},{"value":"1334599801","kind":"OCLC Number"},{"value":"(VaAlASP)5373529","kind":"OCLC Number"},{"value":"(VaAlASP)ASP5373529/marc","kind":"OCLC Number"},{"value":"(OCoLC-P)1334599801","kind":"OCLC Number"},{"value":"(CaSebORM)9781804614839","kind":"OCLC Number"},{"value":"(EXLCZ)995590000001028878","kind":"OCLC Number"}],"languages":["English","In English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53660982330006761&Force_direct=true","kind":"Digital object URL","text":"Academic Video Online (AVON)"}],"locations":[{"value":"England","kind":"Place of Publication"},{"value":"Birmingham, England","kind":"Place of Publication"}],"notes":[{"value":["Manas Dasgupta"],"kind":"Title Statement of Responsibility"},{"value":["Title from resource description page (viewed March 13, 2023)"],"kind":"General Note"},{"value":["Manas Dasgupta, presenter"],"kind":"Participant or Performer Note"}],"physical_description":"1 online resource (387 minutes)","publishers":[{"name":"PACKT Publishing","date":"2022","location":"Birmingham, England"}],"subjects":[{"value":["Electronic data processing"],"kind":"Topical 
Term"},{"value":["Information visualization"],"kind":"Topical Term"},{"value":["Python (Computer program language)"],"kind":"Topical Term"},{"value":["Visual analytics"],"kind":"Topical Term"}],"summary":["f you are working on machine learning projects and want to find patterns and insights from your data on your way to building models, then this course is for you. This course takes a holistic approach to teach visualization techniques.  We will be taking real-life business scenarios and raw data to go through detailed Exploratory Data Analysis (EDA) techniques to prepare the raw data to suit the appropriate visualization needs. You will learn about data analytics and exploratory data analysis techniques using multiple different data structures with NumPy and Pandas libraries. You will also learn various chart/graph types, customization/configuration, and vectorization techniques.  We will look at advanced visualizations using business applications such as single and multiple bar charts, pie charts, and bubble charts with the vectorization of properties. We will further explore Seaborn Boxplot, Violin plot, Categorical Scatterplot, and how to create heat maps.  By the end of the course, you will learn the foundational techniques of data analytics and deeper customizations on visualizations. 
You will be able to confidently use Python visualization libraries such as Matplotlib, Seaborn, and Bokeh in your future projects."],"timdex_provenance":{"source":"alma","run_date":"2026-03-26","run_id":"alma-daily-ingest-2026-03-26t08-31-22","run_record_offset":6857}},"sort":[30.79344,1640995200000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935199842206761","_score":30.79344,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935199842206761","timdex_record_id":"alma:9935199842206761","title":"Data Analytics in Power Markets","call_numbers":["HD9685.A2","363.620212"],"citation":"Chen, Qixin (2021): Data Analytics in Power Markets. Singapore : Springer Nature Singapore :. Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935199842206761","content_type":["Language material"],"contents":["Introduction to power market data and their characteristics","Modeling load forecasting uncertainty using deep learning models","Data-driven load data cleaning and its impacts on forecasting performance","Generalized cost-oriented load forecasting in economic dispatch","A monthly electricity consumption forecasting method","Data-driven pattern extraction for analyzing market bidding behaviors","Stochastic optimal offering based on probabilistic forecast on aggregated supply curves","Power market simulation framework based on learning from individual offering strategy","Deep inverse reinforcement learning for reward function identification in bidding models","The subspace characteristics and congestion identification of LMP data","Online transmission topology identification in LMP-based markets","Day-ahead componential electricity price forecasting","Quantifying the impact of price forecasting error on market bidding","Virtual bidding and FTR speculation based on probabilistic LMP forecasting","Abnormal detection of LMP scenario and data 
with deep neural networks"],"contributors":[{"value":"Chen, Qixin","kind":"author"}],"dates":[{"kind":"Publication date","value":"2021"}],"edition":"1st ed. 2021.","holdings":[{"collection":"SpringerLink Books Energy","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53635138920006761&Force_direct=true"}],"identifiers":[{"value":"981-16-4975-8","kind":"ISBN"},{"value":"10.1007/978-981-16-4975-2. doi","kind":"Other Identifier"},{"value":"(CKB)5360000000049948","kind":"OCLC Number"},{"value":"(MiAaPQ)EBC6739146","kind":"OCLC Number"},{"value":"(Au-PeEL)EBL6739146","kind":"OCLC Number"},{"value":"1273475861","kind":"OCLC Number"},{"value":"(PPN)25830295X","kind":"OCLC Number"},{"value":"(DE-He213)978-981-16-4975-2","kind":"OCLC Number"},{"value":"(EXLCZ)995360000000049948","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53635138920006761&Force_direct=true","kind":"Digital object URL","text":"SpringerLink Books Energy"}],"literary_form":"Nonfiction","locations":[{"value":"Singapore","kind":"Place of Publication"}],"notes":[{"value":["by Qixin Chen, Hongye Guo, Kedi Zheng, Yi Wang"],"kind":"Title Statement of Responsibility"}],"physical_description":"1 online resource (291 pages)","publishers":[{"name":"Springer Nature Singapore :","date":"2021","location":"Singapore"}],"subjects":[{"value":["Energy policy"],"kind":"Topical Term"},{"value":["Machine learning"],"kind":"Topical Term"},{"value":["Electric power production"],"kind":"Topical Term"},{"value":["Power resources"],"kind":"Topical Term"},{"value":["Environmental economics"],"kind":"Topical Term"},{"value":["Energy Policy, Economics and Management"],"kind":"Topical Term"},{"value":["Machine Learning"],"kind":"Topical Term"},{"value":["Electrical Power Engineering"],"kind":"Topical 
Term"},{"value":["Resource and Environmental Economics"],"kind":"Topical Term"}],"summary":["This book aims to solve some key problems in the decision and optimization procedure for power market organizers and participants in data-driven approaches. It begins with an overview of the power market data and analyzes on their characteristics and importance for market clearing. Then, the first part of the book discusses the essential problem of bus load forecasting from the perspective of market organizers. The related works include load uncertainty modeling, bus load bad data correction, and monthly load forecasting. The following part of the book answers how much information can be obtained from public data in locational marginal price (LMP)-based markets. It introduces topics such as congestion identification, componential price forecasting, quantifying the impact of forecasting error, and financial transmission right investment. The final part of the book answers how to model the complex market bidding behaviors. Specific works include pattern extraction, aggregated supply curve forecasting, market simulation, and reward function identification in bidding. These methods are especially useful for market organizers to understand the bidding behaviors of market participants and make essential policies. 
It will benefit and inspire researchers, graduate students, and engineers in the related fields."],"timdex_provenance":{"source":"alma","run_date":"2025-11-07","run_id":"alma-daily-ingest-2025-11-07t09-25-08","run_record_offset":21881}},"sort":[30.79344,1609459200000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9936020869006761","_score":30.79344,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936020869006761","timdex_record_id":"alma:9936020869006761","title":"Data analytics in project management","call_numbers":["HD69.P75","658.4/040285"],"citation":"Data analytics in project management. 2019. Boca Raton, FL : CRC Press, Taylor and Francis Group. Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936020869006761","content_type":["Language material"],"contents":["Why data analytics in project management?","J. Davidson Frame and Yanping Chen","Data analytics risk : lost in translation?","Carl Pritchard","Analytical challenges of a modern PMO","Seweryn Spalek","Data analytics and project portfolio management","Alfonso Bucero","Earned value method","Werner Meyer","How to manage big data issues in a project environment","Ryan Legard","IT solutions of data analytics as applied to project management","Michael Bragen","Conventional and unconventional data mining for better decision-making","Klas Skogmar","Agile project management and data analytics","Deanne Larson","Data analytics and scrum","Bert Brijs"],"contributors":[{"value":"Spalek, Seweryn","kind":"editor"}],"dates":[{"kind":"Publication date","value":"2019"}],"holdings":[{"collection":"Taylor & Francis Discovery Collection","format":"electronic resource","location":"https://www.taylorfrancis.com/books/9780429434891"}],"identifiers":[{"value":"2020692569","kind":"LCCN"},{"value":"9780429786358. epub","kind":"ISBN"},{"value":"0429786352","kind":"ISBN"},{"value":"alk. 
paper","kind":"ISBN"},{"value":"9780429786365","kind":"ISBN"},{"value":"0429786360","kind":"ISBN"},{"value":"0429434898. (electronic bk.)","kind":"ISBN"},{"value":"9780429786341. (electronic bk. ;. Mobipocket)","kind":"ISBN"},{"value":"0429786344. (electronic bk. ;. Mobipocket)","kind":"ISBN"},{"value":"9780429434891. (electronic bk.)","kind":"ISBN"},{"value":"10.1201/9780429434891. doi","kind":"Other Identifier"},{"value":"tayfra9780429434891","kind":"OCLC Number"},{"value":"(NhCcYBP)tayfra9780429434891","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://www.taylorfrancis.com/books/9780429434891","kind":"Digital object URL"},{"url":"https://www.taylorfrancis.com/books/9780429434891","kind":"Digital object URL","text":"Taylor & Francis Discovery Collection"}],"literary_form":"Nonfiction","locations":[{"value":"Florida","kind":"Place of Publication"},{"value":"Boca Raton, FL","kind":"Place of Publication"}],"notes":[{"value":["edited by Seweryn Spalek"],"kind":"Title Statement of Responsibility"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"},{"value":["Description based on print version record"],"kind":"Source of Description Note"}],"physical_description":"1 online resource","publishers":[{"name":"CRC Press, Taylor and Francis Group","date":"[2019]","location":"Boca Raton, FL"}],"related_items":[{"description":"Data analytics applications","relationship":"In Series"}],"subjects":[{"value":["Project management - Data processing"],"kind":"Topical Term"},{"value":["Project management - Statistical methods"],"kind":"Topical Term"}],"summary":["This book aims to help the reader better understand the importance of data analysis in project management. Moreover, it provides guidance by showing tools, methods, techniques and lessons learned on how to better utilize the data gathered from the projects. 
First and foremost, insight into the bridge between data analytics and project management aids practitioners looking for ways to maximize the practical value of data procured. The book equips organizations with the know-how necessary to adapt to a changing workplace dynamic through key lessons learned from past ventures. The book's integrated approach to investigating both fields enhances the value of research findings."],"timdex_provenance":{"source":"alma","run_date":"2026-02-07","run_id":"alma-daily-ingest-2026-02-07t09-21-29","run_record_offset":60143}},"sort":[30.79344,1546300800000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9936021139106761","_score":30.79344,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936021139106761","timdex_record_id":"alma:9936021139106761","title":"Data analytics applications in education","call_numbers":["LB1028.43","370.285"],"citation":"Data analytics applications in education. 2018. Boca Raton, FL : CRC Press. Language material. 
https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936021139106761","content_type":["Language material"],"contents":["Big data analytics in a learning environment / Kristof De Witte and Jan Vanthienen","Improved student feedback with process and data analytics / Johannes De Smedt, Seppe vanden Broucke, Jan Vanthienen and Kristof De Witte","Towards data for development : a model on learning communities as a platform for growing data use / Wouter Schelfhout","The impact of fraudulent behavior on the usefulness of learning analytics applications : the case of question and answer sharing with medium-stakes online quizzing in higher education / Silvester Draaijer and Chris van Klaveren","Disentangling faculty efficiency from students' effort / Cristian Barra, Sergio Destefanis, Vania Sena and Roberto Zotti","Using data analytics to benchmark schools : the case of Portugal / Maria Conceição Portela and Ana S. Camanho","The use of educational data mining procedures to assess students' performance in a bayesian framework / Kristof De Witte, Grazia Graziosi and Joris Hindryckx","Using statistical analytics to study school performance through administrative datasets / Tommaso Agasisti, Francesca Ieva, Chiara Masci, Anna Maria Paganoni, and Mara Soncin","The governance of big data in higher education / Kurt De Wit and Bruno Broucker","Evidence based education and its implications for research and data analytics with an application to the overeducation literature / Wim Groot and Henriëtte Maassen van den Brink"],"contributors":[{"value":"Vanthienen, Jan","kind":"editor"},{"value":"Witte, K. 
de (Kristof)","kind":"editor"}],"dates":[{"kind":"Publication date","value":"2018"}],"holdings":[{"collection":"Taylor & Francis Discovery Collection","format":"electronic resource","location":"https://www.taylorfrancis.com/books/9781315154145"}],"identifiers":[{"value":"9781351650182 (electronic bk.)","kind":"ISBN"},{"value":"1351650181 (electronic bk.)","kind":"ISBN"},{"value":"tayfra9781315154145","kind":"OCLC Number"},{"value":"(NhCcYBP)tayfra9781315154145","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://www.taylorfrancis.com/books/9781315154145","kind":"Digital object URL"},{"url":"https://www.taylorfrancis.com/books/9781315154145","kind":"Digital object URL","text":"Taylor & Francis Discovery Collection"}],"literary_form":"Nonfiction","locations":[{"value":"Florida","kind":"Place of Publication"},{"value":"Boca Raton, FL","kind":"Place of Publication"}],"notes":[{"value":["edited by Jan Vanthienen and Kristof De Witte"],"kind":"Title Statement of Responsibility"},{"value":["Includes bibliographical references"],"kind":"Bibliography Note"},{"value":["Description based on print version record"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (pages cm.)","publishers":[{"name":"CRC Press","date":"2018","location":"Boca Raton, FL"}],"subjects":[{"value":["Education - Data processing"],"kind":"Topical Term"},{"value":["Educational statistics"],"kind":"Topical Term"},{"value":["Big data"],"kind":"Topical Term"}],"timdex_provenance":{"source":"alma","run_date":"2026-02-07","run_id":"alma-daily-ingest-2026-02-07t09-21-29","run_record_offset":64310}},"sort":[30.79344,1514764800000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935440988006761","_score":30.79344,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935440988006761","timdex_record_id":"alma:9935440988006761","title":"Data Analytics for Smart 
Cities","call_numbers":["TD159.4","307.760285"],"citation":"Data Analytics for Smart Cities. 2018. Milton : Auerbach Publications. Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935440988006761","content_type":["Language material"],"contents":["Smartphone technology integrated with machine learning for airport pavement condition assessment / Amir Alavi, William Buttlar","Global satellite observations for smart cities / Zhong Liu, Menglin S. Jin, Jacqueline Liu, Angela Li, William Teng, Bruce Vollmer, and D. Meyer","Advancing smart and resilient cities with big spatial disaster data : challenges, progresses, and opportunities / Xuan Hu and Jie Gong","Smart city portrayal : dynamic visualization applied to the analysis of underground metro / Evgheni Polisciuc and Penousal Machado","Smart bike-sharing systems for smart cities / Hesham A. Rakha","Indirect monitoring of critical transport infrastructure : data analytics and signal processing / Abdollah Malekjafarian","Big data exploration to examine aggressive driving behavior in the era of smart cities / Arash Jahangiri","Exploratory analysis of run-off-road crash patterns / Mohammad Jalayer","Predicting traffic safety risk factors using an ensemble classifier / Nasim Arbabzadeh","Architecture design of internet of things-enabled cloud platform for managing the production of prefabricated public houses / Clyde Zhengdao Li"],"contributors":[{"value":"Alavi, Amir","kind":"Not specified"},{"value":"Buttlar, William G","kind":"Not specified"}],"dates":[{"kind":"Publication date","value":"2018"}],"edition":"1st ed.","holdings":[{"collection":"Taylor & Francis eBooks Complete","format":"electronic 
resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53660230530006761&Force_direct=true"}],"identifiers":[{"value":"0-429-43498-7","kind":"ISBN"},{"value":"0-429-78662-X","kind":"ISBN"},{"value":"0-429-78663-8","kind":"ISBN"},{"value":"9780429434983","kind":"ISBN"},{"value":"(CKB)4100000007121405","kind":"OCLC Number"},{"value":"(MiAaPQ)EBC5566778","kind":"OCLC Number"},{"value":"1061098835","kind":"OCLC Number"},{"value":"(OCoLC-P)1061098835","kind":"OCLC Number"},{"value":"(FlBoTFG)9780429434983","kind":"OCLC Number"},{"value":"(EXLCZ)994100000007121405","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53660230530006761&Force_direct=true","kind":"Digital object URL","text":"Taylor & Francis eBooks Complete"}],"literary_form":"Nonfiction","locations":[{"value":"No place, unknown, or undetermined","kind":"Place of Publication"},{"value":"Milton","kind":"Place of Publication"}],"notes":[{"value":["edited by Amir H. Alavi, William G. Buttlar"],"kind":"Title Statement of Responsibility"},{"value":["4.3.2 Color-Coding"],"kind":"General Note"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"},{"value":["Description based on print version record"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (255 pages) : illustrations (some color).","publishers":[{"name":"Auerbach Publications","date":"2018","location":"Milton"}],"related_items":[{"description":"Data analytics applications","relationship":"In Series"}],"subjects":[{"value":["Smart cities"],"kind":"Topical Term"},{"value":["Big data"],"kind":"Topical Term"},{"value":["Quantitative research"],"kind":"Topical Term"}],"summary":["The development of smart cities is one of the most important challenges over the next few decades. 
Governments and companies are leveraging billions of dollars in public and private funds for smart cities. Next generation smart cities are heavily dependent on distributed smart sensing systems and devices to monitor the urban infrastructure. The smart sensor networks serve as autonomous intelligent nodes to measure a variety of physical or environmental parameters. They should react in time, establish automated control, and collect information for intelligent decision-making. In this context, one of the major tasks is to develop advanced frameworks for the interpretation of the huge amount of information provided by the emerging testing and monitoring systems. Data Analytics for Smart Cities brings together some of the most exciting new developments in the area of integrating advanced data analytics systems into smart cities along with complementary technological paradigms such as cloud computing and Internet of Things (IoT). The book serves as a reference for researchers and engineers in domains of advanced computation, optimization, and data mining for smart civil infrastructure condition assessment, dynamic visualization, intelligent transportation systems (ITS), cyber-physical systems, and smart construction technologies. The chapters are presented in a hands-on manner to facilitate researchers in tackling applications. Arguably, data analytics technologies play a key role in tackling the challenge of creating smart cities. Data analytics applications involve collecting, integrating, and preparing time- and space-dependent data produced by sensors, complex engineered systems, and physical assets, followed by developing and testing analytical models to verify the accuracy of results. This book covers this multidisciplinary field and examines multiple paradigms such as machine learning, pattern recognition, statistics, intelligent databases, knowledge acquisition, data visualization, high performance computing, and expert systems. 
The book explores new territory by discussing the cutting-edge concept of Big Data analytics for interpreting massive amounts of data in smart city applications."],"timdex_provenance":{"source":"alma","run_date":"2026-04-30","run_id":"alma-daily-ingest-2026-04-30t09-50-30","run_record_offset":3964}},"sort":[30.79344,1514764800000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9936022186606761","_score":30.79344,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936022186606761","timdex_record_id":"alma:9936022186606761","title":"Data analytics for internal auditors","call_numbers":["HF5668","657/.458"],"citation":"Cascarino, Richard (2017): Data analytics for internal auditors. Boca Raton : CRC Press, Taylor & Francis Group. Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936022186606761","content_type":["Language material"],"contents":["Chapter 1. Introduction to data analysis","chapter 2. Understanding sampling","chapter 3. Judgmental versus statistical sampling","chapter 4. Probability theory in data analysis","chapter 5. Types of evidence","chapter 6. Population analysis","chapter 7. Correlations, regressions, and other analyses","chapter 8. Conducting the audit","chapter 9. Obtaining information from IT systems for analysis","chapter 10. Use of computer-assisted audit techniques","chapter 11. Analysis of big data","chapter 12. Results analysis and validation","chapter 13. Fraud detection using data analysis","chapter 14. Root cause analysis","chapter 15. Data analysis and continuous monitoring","chapter 16. Continous auditing","chapter 17. Financial analysis","chapter 18. Excel and data analysis","chapter 19. ACL and data analysis","chapter 20. IDEA and data analysis","chapter 21. SAS and data analysis","chapter 22. Analysis reporting","chapter 23. Data visualization and presentation","chapte 24. 
Conclusion"],"contributors":[{"value":"Cascarino, Richard","kind":"author"}],"dates":[{"kind":"Publication date","value":"2017"}],"holdings":[{"collection":"Taylor & Francis Discovery Collection","format":"electronic resource","location":"https://www.taylorfrancis.com/books/9781315369532"}],"identifiers":[{"value":"9781498737159. (electronic bk.)","kind":"ISBN"},{"value":"1498737153. (electronic bk.)","kind":"ISBN"},{"value":"9781315369532. (electronic bk.)","kind":"ISBN"},{"value":"1315369532. (electronic bk.)","kind":"ISBN"},{"value":"tayfra9781315369532","kind":"OCLC Number"},{"value":"(NhCcYBP)tayfra9781315369532","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://www.taylorfrancis.com/books/9781315369532","kind":"Digital object URL"},{"url":"https://www.taylorfrancis.com/books/9781315369532","kind":"Digital object URL","text":"Taylor & Francis Discovery Collection"}],"literary_form":"Nonfiction","locations":[{"value":"Florida","kind":"Place of Publication"},{"value":"Boca Raton","kind":"Place of Publication"}],"notes":[{"value":["Richard E. 
Cascarino"],"kind":"Title Statement of Responsibility"},{"value":["\"An Auerbach book.\""],"kind":"General Note"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"},{"value":["Online resource; title from PDF title page (EBSCO, viewed March 23, 2017)"],"kind":"Source of Description Note"}],"physical_description":"1 online resource : illustrations","publishers":[{"name":"CRC Press, Taylor & Francis Group","date":"[2017]","location":"Boca Raton"},{"date":"©20"},{"date":"©2017"}],"related_items":[{"description":"Internal audit and IT audit","relationship":"In Series"}],"subjects":[{"value":["Auditing, Internal"],"kind":"Topical Term"},{"value":["Electronic data processing - Auditing"],"kind":"Topical Term"}],"summary":["Providing a reference guide for IT and Internal Auditors as well as Fraud Examiners, this book presents information written from the practitioner's viewpoint covering not only the need and the theory, but a practical hands-on approach to conducting data analytics. --"],"timdex_provenance":{"source":"alma","run_date":"2026-02-07","run_id":"alma-daily-ingest-2026-02-07t09-21-29","run_record_offset":39970}},"sort":[30.79344,1483228800000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935113615206761","_score":30.79344,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935113615206761","timdex_record_id":"alma:9935113615206761","title":"Data Analytics for Protein Crystallization","call_numbers":["QH506","572.8"],"citation":"Pusey, Marc L, Aygün, Ramazan Savaş (2017): Data Analytics for Protein Crystallization. Cham : Springer International Publishing :. Language material. 
https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935113615206761","content_type":["Language material"],"contents":["Introduction to Protein Crystallization","Scoring and Phases of Crystallization","Computational Methods for Protein Crystallization Screening","Robotic Image Acquisition","Classification of Crystallization Trial Images","Crystal Growth Analysis","Focal Stacking for Crystallization Microscopy","Crystal Image Region Segmentation","Visualization","Other Structure Determination Methods","Future of Computational Protein Crystallization"],"contributors":[{"value":"Pusey, Marc L","kind":"author"},{"value":"Aygün, Ramazan Savaş","kind":"author"}],"dates":[{"kind":"Publication date","value":"2017"}],"edition":"1st ed. 2017.","holdings":[{"collection":"Springer Nature - Springer Computer Science eBooks 2017 English International","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53690428910006761&Force_direct=true"}],"identifiers":[{"value":"3-319-58937-7","kind":"ISBN"},{"value":"10.1007/978-3-319-58937-4. doi","kind":"Other Identifier"},{"value":"(CKB)4340000000223226","kind":"OCLC Number"},{"value":"(DE-He213)978-3-319-58937-4","kind":"OCLC Number"},{"value":"(MiAaPQ)EBC5163202","kind":"OCLC Number"},{"value":"(PPN)221252045","kind":"OCLC Number"},{"value":"(EXLCZ)994340000000223226","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53690428910006761&Force_direct=true","kind":"Digital object URL","text":"Springer Nature - Springer Computer Science eBooks 2017 English International"}],"literary_form":"Nonfiction","locations":[{"value":"Germany","kind":"Place of Publication"},{"value":"Cham","kind":"Place of Publication"}],"notes":[{"value":["by Marc L. 
Pusey, Ramazan Savaş Aygün"],"kind":"Title Statement of Responsibility"},{"value":["Includes bibliographical references at the end of each chapters and index"],"kind":"Bibliography Note"}],"physical_description":"1 online resource (XX, 231 p. 66 illus., 56 illus. in color.) ","publishers":[{"name":"Springer International Publishing :","date":"2017","location":"Cham"}],"related_items":[{"description":"Computational Biology, 1568-2684 ; 25","relationship":"In Series"}],"subjects":[{"value":["Bioinformatics"],"kind":"Topical Term"},{"value":["Data mining"],"kind":"Topical Term"},{"value":["Optical data processing"],"kind":"Topical Term"},{"value":["Molecular biology"],"kind":"Topical Term"},{"value":["Biotechnology"],"kind":"Topical Term"},{"value":["Computational Biology/Bioinformatics"],"kind":"Topical Term"},{"value":["Data Mining and Knowledge Discovery"],"kind":"Topical Term"},{"value":["Image Processing and Computer Vision"],"kind":"Topical Term"},{"value":["Molecular Medicine"],"kind":"Topical Term"}],"summary":["This unique text/reference presents an overview of the computational aspects of protein crystallization, describing how to build robotic high-throughput and crystallization analysis systems. The coverage encompasses the complete data analysis cycle, including the set-up of screens by analyzing prior crystallization trials, the classification of crystallization trial images by effective feature extraction, the analysis of crystal growth in time series images, the segmentation of crystal regions in images, the application of focal stacking methods for crystallization images, and the visualization of trials. 
Topics and features: Describes the fundamentals of protein crystallization, and the scoring and categorization of crystallization image trials Introduces a selection of computational methods for protein crystallization screening, and the hardware and software architecture for a basic high-throughput system Presents an overview of the image features used in protein crystallization classification, and a spatio-temporal analysis of protein crystal growth Examines focal stacking techniques to avoid blurred crystallization images, and different thresholding methods for binarization or segmentation Discusses visualization methods and software for protein crystallization analysis, and reviews alternative methods to X-ray diffraction for obtaining structural information Provides an overview of the current challenges and potential future trends in protein crystallization This interdisciplinary work serves as an essential reference on the computational and data analytics components of protein crystallization for the structural biology community, in addition to computer scientists wishing to enter the field of protein crystallization. Dr. Marc L. Pusey is a Research Scientist at iXpressGenes, Inc. Huntsville, AL, USA. Dr. Ramazan Savaş Aygün is an Associate Professor in the Computer Science Department of the University of Alabama in Huntsville, USA."],"timdex_provenance":{"source":"alma","run_date":"2025-02-28","run_id":"alma-full-ingest-2025-02-28t22-33-35","run_record_offset":188688}},"sort":[30.79344,1483228800000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935092392506761","_score":30.79344,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935092392506761","timdex_record_id":"alma:9935092392506761","title":"Data Analytics in Digital Humanities","call_numbers":["QA75.5-76.95","005.7"],"citation":"Data Analytics in Digital Humanities. 2017. Cham : Springer International Publishing :. 
Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935092392506761","content_type":["Language material"],"contents":["Semantic Web for Cultural Heritage Valorization","Using the Formal Representations of Elementary Events to Set Up Computational Models of Full Narratives","Parody Detection: An Annotation, Feature Construction, and Classification Approach to the Web of Parody","Creating and Analyzing Literary Corpora","Content and Sentiment Analysis on Online Social Networks (OSNs)","The Role of Data in Evaluating the Effectiveness of Networked Learning: An Auto-Ethnographic Evaluation of Four Experiential Learning Projects","Psychological Text Analysis in the Digital Humanities","Parsing Related Tags Networks from Flickr to Explore Crowd-Sourced Keyword Associations","A Case Study of Crowdsourcing Imagery Coding in Natural Disasters","YouTube Comments as Metalanguage Data on Non-standard Languages: The Case of Trinidadian Creole English in Soca Music","Creating Inheritable Digital Codebooks for Qualitative Research Data Analysis","Is it Worth It? The Library and Information Science Degree in the Digital Humanities"],"contributors":[{"value":"Hai-Jew, Shalin","kind":"editor"}],"dates":[{"kind":"Publication date","value":"2017"}],"edition":"1st ed. 2017.","holdings":[{"collection":"Springer Nature - Springer Computer Science eBooks 2017 English International","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53690453500006761&Force_direct=true"}],"identifiers":[{"value":"3-319-54499-3","kind":"ISBN"},{"value":"10.1007/978-3-319-54499-1. 
doi","kind":"Other Identifier"},{"value":"(CKB)3710000001307197","kind":"OCLC Number"},{"value":"(DE-He213)978-3-319-54499-1","kind":"OCLC Number"},{"value":"(MiAaPQ)EBC4854498","kind":"OCLC Number"},{"value":"(PPN)20147218X","kind":"OCLC Number"},{"value":"(EXLCZ)993710000001307197","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53690453500006761&Force_direct=true","kind":"Digital object URL","text":"Springer Nature - Springer Computer Science eBooks 2017 English International"}],"literary_form":"Nonfiction","locations":[{"value":"Germany","kind":"Place of Publication"},{"value":"Cham","kind":"Place of Publication"}],"notes":[{"value":["edited by Shalin Hai-Jew"],"kind":"Title Statement of Responsibility"},{"value":["Includes bibliographical references at the end of each chapters"],"kind":"Bibliography Note"}],"physical_description":"1 online resource (XXII, 295 p. 37 illus., 23 illus. in color.) ","publishers":[{"name":"Springer International Publishing :","date":"2017","location":"Cham"}],"related_items":[{"description":"Multimedia Systems and Applications","relationship":"In Series"}],"subjects":[{"value":["Computers"],"kind":"Topical Term"},{"value":["Application software"],"kind":"Topical Term"},{"value":["Computer networks"],"kind":"Topical Term"},{"value":["Artificial intelligence"],"kind":"Topical Term"},{"value":["Information Systems and Communication Service"],"kind":"Topical Term"},{"value":["Computer Appl. in Arts and Humanities"],"kind":"Topical Term"},{"value":["Computer Communication Networks"],"kind":"Topical Term"},{"value":["Artificial Intelligence"],"kind":"Topical Term"}],"summary":["This book covers computationally innovative methods and technologies including data collection and elicitation, data processing, data analysis, data visualizations, and data presentation. 
It explores how digital humanists have harnessed the hypersociality and social technologies, benefited from the open-source sharing not only of data but of code, and made technological capabilities a critical part of humanities work. Chapters are written by researchers from around the world, bringing perspectives from diverse fields and subject areas. The respective authors describe their work, their research, and their learning. Topics include semantic web for cultural heritage valorization, machine learning for parody detection by classification, psychological text analysis, crowdsourcing imagery coding in natural disasters, and creating inheritable digital codebooks. Designed for researchers and academics, this book is suitable for those interested in methodologies and analytics that can be applied in literature, history, philosophy, linguistics, and related disciplines. Professionals such as librarians, archivists, and historians will also find the content informative and instructive. ."],"timdex_provenance":{"source":"alma","run_date":"2025-12-25","run_id":"alma-daily-ingest-2025-12-25t15-32-27","run_record_offset":5110}},"sort":[30.79344,1483228800000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935985489406761","_score":30.79344,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935985489406761","timdex_record_id":"alma:9935985489406761","title":"Data Analytics and Applied Mathematics","citation":"Data Analytics and Applied Mathematics. Malaysia : Universiti Malaysia Pahang Publishing. Language material. 
https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935985489406761","content_type":["Language material"],"holdings":[{"collection":"DOAJ Directory of Open Access Journals","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53734187800006761&Force_direct=true","note":"Available from 2020 until 2025."}],"identifiers":[{"value":"2773-4854","kind":"ISSN"},{"value":"(CKB)42026147200041","kind":"OCLC Number"},{"value":"(EXLCZ)9942026147200041","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53734187800006761&Force_direct=true","kind":"Digital object URL","text":"DOAJ Directory of Open Access Journals"}],"locations":[{"value":"No place, unknown, or undetermined","kind":"Place of Publication"},{"value":"Malaysia","kind":"Place of Publication"}],"publishers":[{"name":"Universiti Malaysia Pahang Publishing","location":"Malaysia"}],"timdex_provenance":{"source":"alma","run_date":"2026-01-04","run_id":"alma-daily-ingest-2026-01-04t09-29-06","run_record_offset":8313}},"sort":[30.79344,-9223372036854775808]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935705173306761","_score":30.572212,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935705173306761","timdex_record_id":"alma:9935705173306761","title":"Data Analytics and Machine Learning : Navigating the Big Data Landscape","call_numbers":["QA76.9.Q36","001.422","005.7"],"citation":"Data Analytics and Machine Learning : Navigating the Big Data Landscape. 2024. Singapore : Springer Nature Singapore :. Language material. 
https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935705173306761","content_type":["Language material"],"contents":["Chapter 1. Introduction to Data Analytics, Big Data, and Machine Learning","Chapter 2. Fundamentals of Data Analytics and Lifecycle","Chapter 3. Building Predictive Models with Machine Learning","Chapter 4. Stream data model and architecture","Chapter 5. Leveraging Big Data for Data Analytics","Chapter 6. Advanced Techniques in Data Analytics","Chapter 7. Scalable Machine Learning with Big Data","Chapter 8. Big Data Analytics Framework using Machine Learning on Massive Datasets","Chapter 9. Deep-learning Techniques in Big-Data analytics","Chapter 10. Data Privacy and Ethics in Data Analytics","Chapter 11. Practical Implementation of Machine Learning Techniques & data analytics using R","Chapter 12. Real-World Applications of Data Analytics, Big Data, and Machine Learning","Chapter 13. Implementing Data-Driven Innovation in Organizations","Chapter 14. Business Transformation using Big Data Analytics and Machine Learning","Chapter 15. Future Trends and Emerging Opportunities in HealthAnalytics","Chapter 16. Future Trends in Data Analytics and Machine Learning"],"contributors":[{"value":"Singh, Pushpa","kind":"Not specified"},{"value":"Mishra, Asha Rani","kind":"Not specified"},{"value":"Garg, Payal","kind":"Not specified"}],"dates":[{"kind":"Publication date","value":"2024"}],"edition":"1st ed. 2024.","holdings":[{"collection":"SpringerLink Books Mathematics and Statistics","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53692170200006761&Force_direct=true"}],"identifiers":[{"value":"9789819704484","kind":"ISBN"},{"value":"9819704480","kind":"ISBN"},{"value":"10.1007/978-981-97-0448-4. 
doi","kind":"Other Identifier"},{"value":"(MiAaPQ)EBC31221972","kind":"OCLC Number"},{"value":"(Au-PeEL)EBL31221972","kind":"OCLC Number"},{"value":"(DE-He213)978-981-97-0448-4","kind":"OCLC Number"},{"value":"(CKB)30995669800041","kind":"OCLC Number"},{"value":"1427666886","kind":"OCLC Number"},{"value":"(EXLCZ)9930995669800041","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53692170200006761&Force_direct=true","kind":"Digital object URL","text":"SpringerLink Books Mathematics and Statistics"}],"literary_form":"Nonfiction","locations":[{"value":"Singapore","kind":"Place of Publication"}],"notes":[{"value":["edited by Pushpa Singh, Asha Rani Mishra, Payal Garg"],"kind":"Title Statement of Responsibility"},{"value":["Description based on publisher supplied metadata and other sources"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (357 pages)","publishers":[{"name":"Springer Nature Singapore :","date":"2024","location":"Singapore"}],"related_items":[{"description":"Studies in Big Data, 2197-6511 ; 145","relationship":"In Series"}],"subjects":[{"value":["Quantitative research"],"kind":"Topical Term"},{"value":["Machine learning"],"kind":"Topical Term"},{"value":["Natural language processing (Computer science)"],"kind":"Topical Term"},{"value":["Data Analysis and Big Data"],"kind":"Topical Term"},{"value":["Machine Learning"],"kind":"Topical Term"},{"value":["Natural Language Processing (NLP)"],"kind":"Topical Term"},{"value":["Dades massives"],"kind":"Topical Term"},{"value":["Aprenentatge automàtic"],"kind":"Topical Term"}],"summary":["This book presents an in-depth analysis of successful data-driven initiatives, highlighting how organizations have leveraged data to drive decision-making processes, optimize operations, and achieve remarkable outcomes. 
Through case studies, readers gain valuable insights and learn practical strategies for implementing data analytics, big data, and machine learning solutions in their own organizations. The book discusses the transformative power of data analytics and big data in various industries and sectors and how machine learning applications have revolutionized exploration by enabling advanced data analysis techniques for mapping, geospatial analysis, and environmental monitoring, enhancing our understanding of the world and its dynamic processes. This book explores how big data explosion, the power of analytics and machine learning revolution can bring new prospects and opportunities in the dynamic and data-rich landscape. It highlights the future research directions in data analytics, big data, and machine learning that explores the emerging trends, challenges, and opportunities in these fields by covering interdisciplinary approaches such as handling and analyzing real-time and streaming data."],"timdex_provenance":{"source":"alma","run_date":"2026-02-24","run_id":"alma-daily-ingest-2026-02-24t09-21-06","run_record_offset":2713}},"sort":[30.572212,1704067200000]}]},"aggregations":{"places":{"doc_count":1782053,"only_spatial":{"doc_count":147572,"place_names":{"doc_count_error_upper_bound":536,"sum_other_doc_count":126725,"buckets":[{"key":"arctic ocean","doc_count":3374},{"key":"europe","doc_count":3116},{"key":"united states","doc_count":2671},{"key":"massachusetts","doc_count":2390},{"key":"new jersey","doc_count":2083},{"key":"canada","doc_count":1674},{"key":"china","doc_count":1664},{"key":"earth (planet)","doc_count":1452},{"key":"california","doc_count":1346},{"key":"wisconsin","doc_count":1077}]}}},"languages":{"doc_count_error_upper_bound":36,"sum_other_doc_count":6277,"buckets":[{"key":"english","doc_count":282441},{"key":"eng","doc_count":19187},{"key":"en_us","doc_count":10104},{"key":"en","doc_count":8904},{"key":"in 
english","doc_count":3171},{"key":"german","doc_count":1696},{"key":"french","doc_count":977},{"key":"fra","doc_count":947},{"key":"spanish","doc_count":895},{"key":"russian","doc_count":772}]},"content_type":{"doc_count_error_upper_bound":2,"sum_other_doc_count":16691,"buckets":[{"key":"language material","doc_count":228427},{"key":"polygon data","doc_count":28600},{"key":"article","doc_count":15681},{"key":"image data","doc_count":13247},{"key":"raster data","doc_count":11629},{"key":"thesis","doc_count":11627},{"key":"manuscript language material","doc_count":9646},{"key":"line data","doc_count":8771},{"key":"point data","doc_count":8135},{"key":"not specified","doc_count":5581}]},"subjects":{"doc_count":1782053,"subject_names":{"doc_count_error_upper_bound":6711,"sum_other_doc_count":1599602,"buckets":[{"key":"datasets","doc_count":53692},{"key":"boundaries","doc_count":26136},{"key":"artificial intelligence","doc_count":24248},{"key":"other","doc_count":21480},{"key":"transportation","doc_count":19587},{"key":"society","doc_count":15058},{"key":"united states","doc_count":10085},{"key":"computer networks","doc_count":9451},{"key":"computational intelligence","doc_count":9229},{"key":"oceans","doc_count":9100}]}},"content_format":{"doc_count_error_upper_bound":0,"sum_other_doc_count":173,"buckets":[{"key":"shapefile","doc_count":45170},{"key":"electronic resource","doc_count":36057},{"key":"geotiff","doc_count":14161},{"key":"tiff","doc_count":11827},{"key":"mixed","doc_count":831},{"key":"jpeg","doc_count":340},{"key":"arcgrid","doc_count":266},{"key":"pdf","doc_count":225},{"key":"las","doc_count":148},{"key":"laz","doc_count":103}]},"literary_form":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[{"key":"nonfiction","doc_count":219062},{"key":"fiction","doc_count":13722}]},"source":{"doc_count_error_upper_bound":0,"sum_other_doc_count":107,"buckets":[{"key":"mit alma","doc_count":245774},{"key":"opengeometadata gis 
resources","doc_count":73620},{"key":"dspace@mit","doc_count":29922},{"key":"woods hole open access server","doc_count":2994},{"key":"mit gis resources","doc_count":2029},{"key":"zenodo","doc_count":2013},{"key":"libguides","doc_count":629},{"key":"mit libraries website","doc_count":273},{"key":"mit archivesspace","doc_count":247},{"key":"research databases","doc_count":119}]},"contributors":{"doc_count":1241176,"contributor_names":{"doc_count_error_upper_bound":2065,"sum_other_doc_count":1191596,"buckets":[{"key":"national bureau of economic research","doc_count":12657},{"key":"massachusetts institute of technology. department of electrical engineering and computer science","doc_count":6936},{"key":"institute of electrical and electronics engineers","doc_count":4459},{"key":"boundary solutions, inc.","doc_count":4081},{"key":"geological survey (u.s.)","doc_count":4077},{"key":"collins bartholomew ltd","doc_count":3653},{"key":"massachusetts institute of technology. department of physics","doc_count":3614},{"key":"u.s. department of commerce, bureau of the census, geography division","doc_count":3530},{"key":"arctic climate system (acsys)","doc_count":3349},{"key":"massachusetts institute of technology. 
department of mechanical engineering","doc_count":3224}]}},"access_to_files":{"doc_count":191520,"only_file_access":{"doc_count":75649,"access_types":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[{"key":"unknown: check with owning institution","doc_count":73620},{"key":"MIT authentication required","doc_count":1198},{"key":"no authentication required","doc_count":831}]}}}}} + recorded_at: Thu, 30 Apr 2026 22:47:37 GMT +recorded_with: VCR 6.4.0 diff --git a/test/vcr_cassettes/graphql_search_data_analytics_keyword.yml b/test/vcr_cassettes/graphql_search_data_analytics_keyword.yml new file mode 100644 index 00000000..07778329 --- /dev/null +++ b/test/vcr_cassettes/graphql_search_data_analytics_keyword.yml @@ -0,0 +1,50 @@ +--- +http_interactions: +- request: + method: post + uri: http://localhost:9200/all-current/_search + body: + encoding: UTF-8 + string: '{"from":"0","size":20,"query":{"bool":{"should":[{"prefix":{"title.exact_value":{"value":"data + analytics","boost":15.0}}},{"term":{"title":{"value":"data analytics","boost":1.0}}},{"nested":{"path":"contributors","query":{"term":{"contributors.value":{"value":"data + analytics","boost":0.1}}}}}],"must":[{"multi_match":{"query":"data analytics","fields":["alternate_titles","call_numbers","citation","contents","contributors.value","dates.value","edition","funding_information.*","identifiers.value","languages","locations.value","notes.value","numbering","publication_information","subjects.value","summary","title"],"minimum_should_match":"0%"}}],"filter":[]}},"aggregations":{"access_to_files":{"nested":{"path":"rights"},"aggs":{"only_file_access":{"filter":{"terms":{"rights.kind":["Access + to 
files"]}},"aggs":{"access_types":{"terms":{"field":"rights.description.keyword"}}}}}},"contributors":{"nested":{"path":"contributors"},"aggs":{"contributor_names":{"terms":{"field":"contributors.value.keyword"}}}},"content_type":{"terms":{"field":"content_type"}},"content_format":{"terms":{"field":"format"}},"languages":{"terms":{"field":"languages.keyword"}},"literary_form":{"terms":{"field":"literary_form"}},"places":{"nested":{"path":"subjects"},"aggs":{"only_spatial":{"filter":{"terms":{"subjects.kind":["Dublin + Core; Spatial"]}},"aggs":{"place_names":{"terms":{"field":"subjects.value.keyword"}}}}}},"source":{"terms":{"field":"source"}},"subjects":{"nested":{"path":"subjects"},"aggs":{"subject_names":{"terms":{"field":"subjects.value.keyword"}}}}},"sort":[{"_score":{"order":"desc"}},{"dates.value.as_date":{"order":"desc","nested":{"path":"dates"}}}]}' + headers: + User-Agent: + - 'opensearch-ruby/3.4.0 (RUBY_VERSION: 3.4.9; darwin arm64; Faraday v2.14.0)' + Content-Type: + - application/json + Host: + - localhost:9200 + X-Amz-Date: + - 20260428T204910Z + X-Amz-Content-Sha256: + - "" + Authorization: + - "" + Accept-Encoding: + - gzip;q=1.0,deflate;q=0.6,identity;q=0.3 + Accept: + - "*/*" + response: + status: + code: 200 + message: OK + headers: + Date: + - Tue, 28 Apr 2026 20:49:13 GMT + Content-Type: + - application/json; charset=UTF-8 + Content-Length: + - '96963' + Connection: + - keep-alive + Access-Control-Allow-Origin: + - "*" + body: + encoding: ASCII-8BIT + string: !binary |- + {"took":3196,"timed_out":false,"_shards":{"total":23,"successful":23,"skipped":0,"failed":0},"hits":{"total":{"value":10000,"relation":"gte"},"max_score":null,"hits":[{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935181015606761","_score":32.33922,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935181015606761","timdex_record_id":"alma:9935181015606761","title":"Data analytics and big 
data","call_numbers":["QA76.9.B45","005.7"],"citation":"Sedkaoui, Soraya (2018): Data analytics and big data. Hoboken, New Jersey : ISTE Ltd/John Wiley and Sons Inc. Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935181015606761","content_type":["Language material"],"contents":["Cover","Half-Title Page","Dedication","Title Page","Copyright Page","Contents","Acknowledgments","Preface","Introduction","Why this book?","Whom is this book for?","Organization of the book","Glossary","PART 1 Towards an Understanding of Big Data:Are You Ready?","1. From Data to Big Data: You Must Walk Before You Can Run","1.1. Introduction","1.2. No analytics without data","1.2.1. Databases","1.2.2. Raw data","1.2.3. Text","1.2.4. Images, audios and videos","1.2.5. The Internet of Things","1.3. From bytes to yottabytes: the data revolution","1.4. Big data: definition","1.5. The 3Vs model","1.6. Why now and what does it bring?","1.7. Conclusions","2. Big Data: A Revolution that Changes the Game","2.1. Introduction","2.2. Beyond the 3Vs","2.3. From understanding data to knowledge","2.4. Improving decision-making","2.5. Things to take into account","2.5.1. Data complexity","2.5.2. Data quality: look out! Not all data are the right data","2.5.3. What else?…Data security","2.6. Big data and businesses","2.6.1. Opportunities","2.6.2. Challenges","2.7. Conclusions","PART 2 Big Data Analytics: A Compilation of Advanced Analytics Techniques that Covers a Wide Range of Data","3. Building an Understanding of Big Data Analytics","3.1. Introduction","3.2. Before breaking down the process… What is data analytics?","3.3. Before and after big data analytics","3.4. Traditional versus advanced analytics: What is the difference?","3.5. Advanced analytics: new paradigm","3.6. New statistical and computational paradigm within the big data context","3.7. Conclusions","4. Why Data Analytics and When Can We Use It?","4.1. Introduction","4.2. 
Understanding the changes in context","4.3. When real time makes the difference","4.4. What should data analytics address?","4.5. Analytics culture within companies","4.6. Big data analytics application: examples","4.7. Conclusions","5. Data Analytics Process: There's Great Work Behind the Scenes","5.1. Introduction","5.2. More data, more questions for better answers","5.2.1. We can never say it enough: \"there is no good wind for those who don't know where they are going\"","5.2.2. Understanding the basics: identify what we already know and what we have yet to find out","5.2.3. Defining the tasks to be accomplished","5.2.4. Which technology to adopt?","5.2.5. Understanding data analytics is good but knowing how to use it is better! (What skills do you need?)","5.2.6. What does the data project cost and how will it pay off in time?","5.2.7. What will it mean to you once you find out?","5.3. Next steps: do you have an idea about a \"secret sauce\"?","5.3.1. First phase: find the data (data collection)","5.3.2. Second phase: construct the data (data preparation)","5.3.3. Third phase: go to exploration and modeling (data analysis)","5.3.4. Fourth phase: evaluate and interpret the results (evaluation and interpretation)","5.3.5. Fifth phase: transform data into actionable knowledge (deploy the model)","5.4. Disciplines that support the big data analytics process","5.4.1. Statistics","5.4.2. Machine learning","5.4.3. Data mining","5.4.4. Text mining","5.4.5. Database management systems","5.4.6. Data streams management systems","5.5. Wait, it's not so simple: what to avoid when building a","5.5.1. Minimize the model error","5.5.2. Maximize the likelihood of the model","5.5.3. What about surveys?","5.6. Conclusions","PART 3 Data Analytics and Machine Learning: the Relevance of Algorithms","6. Machine Learning: a Method of Data Analysis that Automates Analytical Model Building","6.1. Introduction","6.2. 
From simple descriptive analysis to predictive and prescriptive analyses: what are the different steps?","6.3. Artificial intelligence: algorithms and techniques","6.4. ML: what is it?","6.5. Why is it important?","6.6. How does ML work?","6.6.1. Definition the business need (problem statement) and its formalization","6.6.2. Collection and preparation of the useful data that will be used to meet this need","6.6.3. Test the performance of the obtained model","6.6.4. Optimization and production start","6.7. Data scientist: the new alchemist","6.8. Conclusion","7. Supervised versus Unsupervised Algorithms: a Guided Tour","7.1. Introduction","7.2. Supervised and unsupervised learning","7.2.1. Supervised learning: predict, predict and predict!","7.2.2. Unsupervised learning: go to profiles search!","7.3. Regression versus classification","7.3.1. Regression","7.3.2. Classification","7.4. Clustering gathers data","7.4.1. What good could it serve?","7.4.2. Principle of clustering algorithms","7.4.3. Partitioning your data by using the K-means algorithm","7.5. Conclusion","8. Applications and Examples","8.1. Introduction","8.2. Which algorithm to use?","8.2.1. Supervised or unsupervised algorithm: in which case do we use each one?","8.2.2. What about other ML algorithms?","8.3. The duo big data/ML: examples of use","8.3.1. Netflix: show me what you are looking at and I'll personalize what you like","8.3.2. Amazon: when AI comes into your everyday life","8.3.3. And more: proof that data are a source of creativity","8.4. 
Conclusions","Bibliography","Index","Other titles from iSTE in Computer Engineering","EULA"],"contributors":[{"value":"Sedkaoui, Soraya","kind":"author"}],"dates":[{"kind":"Publication date","value":"2018"}],"edition":"1st ed.","holdings":[{"collection":"Wiley Online Library","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53636613240006761&Force_direct=true"}],"identifiers":[{"value":"9781119528067","kind":"ISBN"},{"value":"1119528062","kind":"ISBN"},{"value":"9781119528050","kind":"ISBN"},{"value":"1119528054","kind":"ISBN"},{"value":"9781119528043","kind":"ISBN"},{"value":"1119528046","kind":"ISBN"},{"value":"(CKB)4100000004385186","kind":"OCLC Number"},{"value":"(Au-PeEL)EBL5401178","kind":"OCLC Number"},{"value":"(CaPaEBR)ebr11564831","kind":"OCLC Number"},{"value":"(PPN)236433105","kind":"OCLC Number"},{"value":"1037945978","kind":"OCLC Number"},{"value":"(MiAaPQ)EBC5401178","kind":"OCLC Number"},{"value":"(Perlego)996164","kind":"OCLC Number"},{"value":"(EXLCZ)994100000004385186","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53636613240006761&Force_direct=true","kind":"Digital object URL","text":"Wiley Online Library"}],"literary_form":"Nonfiction","locations":[{"value":"New Jersey","kind":"Place of Publication"},{"value":"Hoboken, New Jersey","kind":"Place of Publication"}],"notes":[{"value":["Soraya Sedkaoui"],"kind":"Title Statement of Responsibility"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"},{"value":["Description based on print version record"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (225 pages)","publishers":[{"name":"ISTE Ltd/John Wiley and Sons Inc","date":"2018","location":"Hoboken, New Jersey"}],"subjects":[{"value":["Big 
data"],"kind":"Topical Term"},{"value":["Databases"],"kind":"Topical Term"},{"value":["Database management"],"kind":"Topical Term"}],"summary":["The main purpose of this book is to investigate, explore and describe approaches and methods to facilitate data understanding through analytics solutions based on its principles, concepts and applications. But analyzing data is also about involving the use of software. For this, and in order to cover some aspect of data analytics, this book uses software (Excel, SPSS, Python, etc) which can help readers to better understand the analytics process in simple terms and supporting useful methods in its application. "],"timdex_provenance":{"source":"alma","run_date":"2025-04-14","run_id":"alma-daily-ingest-2025-04-14t08-28-27","run_record_offset":5691}},"sort":[32.33922,1514764800000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9936024273806761","_score":32.05078,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936024273806761","timdex_record_id":"alma:9936024273806761","title":"Data Analytics Initiatives  : Managing Analytics for Success","call_numbers":["P53.755","001.42"],"citation":"Data Analytics Initiatives  : Managing Analytics for Success. 2022. Milton : Auerbach Publishers, Incorporated. Language material. 
https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936024273806761","content_type":["Language material"],"contributors":[{"value":"Bothe, Ondřej","kind":"Not specified"},{"value":"Kubera, Ondřej","kind":"Not specified"},{"value":"Bednář, David","kind":"Not specified"},{"value":"Potančok, Martin","kind":"Not specified"},{"value":"Novotný, Ota","kind":"Not specified"}],"dates":[{"kind":"Publication date","value":"2022"}],"holdings":[{"collection":"Taylor & Francis Discovery Collection","format":"electronic resource","location":"https://www.taylorfrancis.com/books/9781003304081"}],"identifiers":[{"value":"9781000629347","kind":"ISBN"},{"value":"1000629341","kind":"ISBN"},{"value":"9781000629293. (electronic bk.)","kind":"ISBN"},{"value":"1000629295. (electronic bk.)","kind":"ISBN"},{"value":"9781003304081. (electronic bk.)","kind":"ISBN"},{"value":"1003304087. (electronic bk.)","kind":"ISBN"},{"value":"10.1201/9781003304081. doi","kind":"Other Identifier"},{"value":"tayfra9781003304081","kind":"OCLC Number"},{"value":"(NhCcYBP)tayfra9781003304081","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://www.taylorfrancis.com/books/9781003304081","kind":"Digital object URL"},{"url":"https://www.taylorfrancis.com/books/9781003304081","kind":"Digital object URL","text":"Taylor & Francis Discovery Collection"}],"literary_form":"Nonfiction","locations":[{"value":"No place, unknown, or undetermined","kind":"Place of Publication"},{"value":"Milton","kind":"Place of Publication"}],"notes":[{"value":["Description based upon print version of record"],"kind":"General Note"}],"physical_description":"1 online resource (164 p.)","publishers":[{"name":"Auerbach Publishers, Incorporated","date":"2022","location":"Milton"}],"subjects":[{"value":["Quantitative research"],"kind":"Topical Term"},{"value":["Research - Data processing"],"kind":"Topical Term"}],"summary":["The categorisation of analytical projects could help to 
simplify complexity reasonably and, at the same time, clarify the critical aspects of analytical initiatives. But how can this complex work be categorized? What makes it so complex? Data Analytics Initiatives: Managing Analytics for Success emphasizes that each analytics project is different. At the same time, analytics projects have many common aspects, and these features make them unique compared to other projects. Describing these commonalities helps to develop a conceptual understanding of analytical work. However, features specific to each initiative affects the entire analytics project lifecycle. Neglecting them by trying to use general approaches without tailoring them to each project can lead to failure. In addition to examining typical characteristics of the analytics project and how to categorise them, the book looks at specific types of projects, provides a high-level assessment of their characteristics from a risk perspective, and comments on the most common problems or challenges. The book also presents examples of questions that could be asked of relevant people to analyse an analytics project. These questions help to position properly the project and to find commonalities and general project challenges."],"timdex_provenance":{"source":"alma","run_date":"2026-02-07","run_id":"alma-daily-ingest-2026-02-07t09-21-29","run_record_offset":23276}},"sort":[32.05078,1640995200000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9936019383706761","_score":31.500599,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936019383706761","timdex_record_id":"alma:9936019383706761","title":"Data Analytics in Finance","call_numbers":["HG104","332.0285"],"citation":"Data Analytics in Finance. 2025. Boca Raton : CRC Press, Taylor & Francis Group. Language material. 
https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936019383706761","content_type":["Language material"],"contributors":[{"value":"Dong, Juijian","kind":"Not specified"}],"dates":[{"kind":"Publication date","value":"2025"}],"edition":"First edition.","holdings":[{"collection":"Taylor & Francis Discovery Collection","format":"electronic resource","location":"https://www.taylorfrancis.com/books/9781003620198"}],"identifiers":[{"value":"1040349749. electronic book","kind":"ISBN"},{"value":"9781040349748. electronic book","kind":"ISBN"},{"value":"9781003620198. electronic book","kind":"ISBN"},{"value":"1003620191. electronic book","kind":"ISBN"},{"value":"9781040349687. electronic book","kind":"ISBN"},{"value":"1040349684. electronic book","kind":"ISBN"},{"value":"10.1201/9781003620198. doi","kind":"Other Identifier"},{"value":"tayfra9781003620198","kind":"OCLC Number"},{"value":"(NhCcYBP)tayfra9781003620198","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://www.taylorfrancis.com/books/9781003620198","kind":"Digital object URL"},{"url":"https://www.taylorfrancis.com/books/9781003620198","kind":"Digital object URL","text":"Taylor & Francis Discovery Collection"}],"literary_form":"Nonfiction","locations":[{"value":"Florida","kind":"Place of Publication"},{"value":"Boca Raton","kind":"Place of Publication"}],"notes":[{"value":["Huijian Dong"],"kind":"Title Statement of Responsibility"},{"value":["\"An Auerbach Book.\""],"kind":"General Note"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"},{"value":["Description based on online resource; title from digital title page (viewed on April 28, 2025)"],"kind":"Source of Description Note"}],"physical_description":"1 online resource","publishers":[{"name":"CRC Press, Taylor & Francis Group","date":"2025","location":"Boca Raton"}],"related_items":[{"description":"Data analytics applications","relationship":"In 
Series"}],"subjects":[{"value":["Finance - Data processing"],"kind":"Topical Term"}],"summary":["Data Analytics in Finance covers the methods and application of data analytics in all major areas of finance, including buy-side investments, sell-side investment banking, corporate finance, consumer finance, financial services, real estate, insurance, and commercial banking. It explains statistical inference of big data, financial modeling, machine learning, database querying, data engineering, data visualization, and risk analysis. Emphasizing financial data analytics practices with a solution- oriented purpose, it is a \"one-stop-shop\" of all the major data analytics aspects for each major finance area.The book paints a comprehensive picture of the data analytics process including: Statistical inference of big data Financial modeling Machine learning and AI Database querying Data engineering Data visualization Risk analysis Each chapter is crafted to provide complete guidance for many subject areas including investments, fraud detection, and consumption finance. Avoiding data analytics methods widely available elsewhere, the book focuses on providing data analytics methods specifically applied to key areas of finance. Written as a roadmap for researchers, practitioners, and students to master data analytics instruments in finance, the book also provides a collection of indispensable resources for the readers' reference. 
Offering the knowledge and tools necessary to thrive in a data-driven financial landscape, this book enables readers to deepen their understanding of investments, develop new approaches to risk management, and apply data analytics to finance."],"timdex_provenance":{"source":"alma","run_date":"2026-02-07","run_id":"alma-daily-ingest-2026-02-07t09-21-29","run_record_offset":24583}},"sort":[31.500599,1735689600000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935705087506761","_score":31.500599,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935705087506761","timdex_record_id":"alma:9935705087506761","title":"Data Analytics in Spectroscopy","call_numbers":["Q342","006.3"],"citation":"Dubrovkin, Joseph (2024): Data Analytics in Spectroscopy. Newcastle upon Tyne, England : Cambridge Scholars Publishing. Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935705087506761","content_type":["Language material"],"contents":["Intro","Table of Contents","Preface","About the Structure of the Book","Abbreviations","PART I","Introduction","Chapter One","Chapter Two","Chapter Three","Chapter Four","Conclusion","PART II","PART III","Chapter Five","PART IV","Afterword","Appendix A","Appendix B","Appendix C","Appendix D","Appendix E","Appendix F","Appendix G","Appendix H","Appendix I","Bibliography","Index"],"contributors":[{"value":"Dubrovkin, Joseph","kind":"author"}],"dates":[{"kind":"Publication date","value":"2024"}],"edition":"First edition.","holdings":[{"collection":"Ebook Central Perpetual, DDA and Subscription Titles","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53692164220006761&Force_direct=true"}],"identifiers":[{"value":"1-5275-8037-7","kind":"ISBN"},{"value":"(MiAaPQ)EBC31136556","kind":"OCLC 
Number"},{"value":"(Au-PeEL)EBL31136556","kind":"OCLC Number"},{"value":"(EXLCZ)9930322696600041","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53692164220006761&Force_direct=true","kind":"Digital object URL","text":"Ebook Central Perpetual, DDA and Subscription Titles"}],"literary_form":"Nonfiction","locations":[{"value":"England","kind":"Place of Publication"},{"value":"Newcastle upon Tyne, England","kind":"Place of Publication"}],"notes":[{"value":["Joseph Dubrovkin"],"kind":"Title Statement of Responsibility"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"},{"value":["Description based on print version record"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (510 pages)","publishers":[{"name":"Cambridge Scholars Publishing","date":"[2024]","location":"Newcastle upon Tyne, England"},{"date":"©2024"}],"subjects":[{"value":["Computational intelligence"],"kind":"Topical Term"},{"value":["Artificial intelligence"],"kind":"Topical Term"},{"value":["Biomedical engineering"],"kind":"Topical Term"}],"summary":["This textbook summarizes various studies and significant materials on data analytics in spectroscopy. Its rigorous mathematical basis, in-depth description, and numerous examples of applications in chemistry and physics make this book valuable for theorists, practitioners, and students specializing in data processing in spectroscopy, chemometrics, and analytical chemistry.The bibliography briefly describes hundreds of data analytics applications for solving spectroscopic tasks in industrial and research laboratories. This book differs from existing brief reviews and articles on this topic in that it forms, for the first time, the big picture of all kinds of data analytics methods in spectroscopy. 
The book also provides quickly reproducible computer calculations to illustrate its significant theoretical statements. As such, it can also serve as a practical guide to lecturers in data analytics in the broad field of spectroscopy, including chemometrics and analytical chemistry."],"timdex_provenance":{"source":"alma","run_date":"2025-09-26","run_id":"alma-daily-ingest-2025-09-26t08-22-09","run_record_offset":2063}},"sort":[31.500599,1704067200000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9936020329006761","_score":31.500599,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936020329006761","timdex_record_id":"alma:9936020329006761","title":"Data Analytics in Spectroscopy","call_numbers":["Q342","006.3"],"citation":"Dubrovkin, Joseph (2024): Data Analytics in Spectroscopy. Newcastle upon Tyne, England : Cambridge Scholars Publishing. Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936020329006761","content_type":["Language material"],"contents":["Intro","Table of Contents","Preface","About the Structure of the Book","Abbreviations","PART I","Introduction","Chapter One","Chapter Two","Chapter Three","Chapter Four","Conclusion","PART II","PART III","Chapter Five","PART IV","Afterword","Appendix A","Appendix B","Appendix C","Appendix D","Appendix E","Appendix F","Appendix G","Appendix H","Appendix I","Bibliography","Index"],"contributors":[{"value":"Dubrovkin, Joseph","kind":"author"}],"dates":[{"kind":"Publication date","value":"2024"}],"edition":"First edition.","holdings":[{"collection":"Taylor & Francis Discovery Collection","format":"electronic resource","location":"https://www.taylorfrancis.com/books/9781042824519"}],"identifiers":[{"value":"1527580377","kind":"ISBN"},{"value":"9781527580374","kind":"ISBN"},{"value":"tayfra9781042824519","kind":"OCLC 
Number"},{"value":"(NhCcYBP)tayfra9781042824519","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://www.taylorfrancis.com/books/9781042824519","kind":"Digital object URL"},{"url":"https://www.taylorfrancis.com/books/9781042824519","kind":"Digital object URL","text":"Taylor & Francis Discovery Collection"}],"literary_form":"Nonfiction","locations":[{"value":"England","kind":"Place of Publication"},{"value":"Newcastle upon Tyne, England","kind":"Place of Publication"}],"notes":[{"value":["Joseph Dubrovkin"],"kind":"Title Statement of Responsibility"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"},{"value":["Description based on print version record"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (510 pages)","publishers":[{"name":"Cambridge Scholars Publishing","date":"[2024]","location":"Newcastle upon Tyne, England"},{"date":"©2024"}],"subjects":[{"value":["Computational intelligence"],"kind":"Topical Term"},{"value":["Artificial intelligence"],"kind":"Topical Term"},{"value":["Biomedical engineering"],"kind":"Topical Term"}],"summary":["This textbook summarizes various studies and significant materials on data analytics in spectroscopy. Its rigorous mathematical basis, in-depth description, and numerous examples of applications in chemistry and physics make this book valuable for theorists, practitioners, and students specializing in data processing in spectroscopy, chemometrics, and analytical chemistry.The bibliography briefly describes hundreds of data analytics applications for solving spectroscopic tasks in industrial and research laboratories. This book differs from existing brief reviews and articles on this topic in that it forms, for the first time, the big picture of all kinds of data analytics methods in spectroscopy. The book also provides quickly reproducible computer calculations to illustrate its significant theoretical statements. 
As such, it can also serve as a practical guide to lecturers in data analytics in the broad field of spectroscopy, including chemometrics and analytical chemistry."],"timdex_provenance":{"source":"alma","run_date":"2026-02-07","run_id":"alma-daily-ingest-2026-02-07t09-21-29","run_record_offset":56300}},"sort":[31.500599,1704067200000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935427370706761","_score":31.500599,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935427370706761","timdex_record_id":"alma:9935427370706761","title":"Data analytics for cybersecurity","call_numbers":["QA76.9.A25","005.8"],"citation":"Janeja, Vandana P (2022): Data analytics for cybersecurity. Cambridge ; New York, NY : Cambridge University Press. Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935427370706761","content_type":["Language material"],"contents":["Introduction - data analytics for cybersecurity","Understanding sources of cybersecurity data","Introduction to data mining : clustering, classification and association rule mining","Big data analytics and its need for cybersecurity","Types of cyber attacks","Anomaly detection for cyber security","Anomaly detection","Cybersecurity through time series and spatial data","Cybersecurity through network and graph data","Human centered data analytics for cyber security","Future directions in data analytics for cybersecurity"],"contributors":[{"value":"Janeja, Vandana P","kind":"author"}],"dates":[{"kind":"Publication date","value":"2022"}],"edition":"First edition.","holdings":[{"collection":"Cambridge eBooks and Partner Presses: Full EBA, All eBooks","format":"electronic 
resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53658698790006761&Force_direct=true"}],"identifiers":[{"value":"1-108-24632-X","kind":"ISBN"},{"value":"1-108-23195-0","kind":"ISBN"},{"value":"26930118ECA3DD8EDED4DACA97997439","kind":"OCLC Number"},{"value":"(CKB)24353022000041","kind":"OCLC Number"},{"value":"(UkCbUP)CR9781108231954","kind":"OCLC Number"},{"value":"(MiAaPQ)EBC7109862","kind":"OCLC Number"},{"value":"(Au-PeEL)EBL7109862","kind":"OCLC Number"},{"value":"1286068774","kind":"OCLC Number"},{"value":"(EXLCZ)9924353022000041","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53658698790006761&Force_direct=true","kind":"Digital object URL","text":"Cambridge eBooks and Partner Presses: Full EBA, All eBooks"}],"literary_form":"Nonfiction","locations":[{"value":"England","kind":"Place of Publication"},{"value":"Cambridge ; New York, NY","kind":"Place of Publication"}],"notes":[{"value":["Vandana P. Janeja"],"kind":"Title Statement of Responsibility"},{"value":["Title from publisher's bibliographic system (viewed on 10 Aug 2022)"],"kind":"General Note"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"}],"physical_description":"1 online resource (xiii, 192 pages) : digital, PDF file(s).","publishers":[{"name":"Cambridge University Press","date":"2022","location":"Cambridge ; New York, NY"}],"subjects":[{"value":["Computer security - Data processing"],"kind":"Topical Term"},{"value":["Data mining"],"kind":"Topical Term"}],"summary":["As the world becomes increasingly connected, it is also more exposed to a myriad of cyber threats. We need to use multiple types of tools and techniques to learn and understand the evolving threat landscape. Data is a common thread linking various types of devices and end users. 
Analyzing data across different segments of cybersecurity domains, particularly data generated during cyber-attacks, can help us understand threats better, prevent future cyber-attacks, and provide insights into the evolving cyber threat landscape. This book takes a data oriented approach to studying cyber threats, showing in depth how traditional methods such as anomaly detection can be extended using data analytics and also applies data analytics to non-traditional views of cybersecurity, such as multi domain analysis, time series and spatial data analysis, and human-centered cybersecurity."],"timdex_provenance":{"source":"alma","run_date":"2026-02-12","run_id":"alma-daily-ingest-2026-02-12t09-17-27","run_record_offset":9049}},"sort":[31.500599,1640995200000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9936021890206761","_score":31.500599,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936021890206761","timdex_record_id":"alma:9936021890206761","title":"Data analytics and AI","call_numbers":["QA276.4","001.4/22028563"],"citation":"Data analytics and AI. 2021. Boca Raton, FL : CRC Press, Taylor & Francis Group. Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936021890206761","content_type":["Language material"],"contributors":[{"value":"Liebowitz, Jay","kind":"editor"}],"dates":[{"kind":"Publication date","value":"2021"}],"edition":"First edition.","holdings":[{"collection":"Taylor & Francis Discovery Collection","format":"electronic resource","location":"https://www.taylorfrancis.com/books/9781003019855"}],"identifiers":[{"value":"2020012383","kind":"LCCN"},{"value":"9781000094657. electronic book","kind":"ISBN"},{"value":"1000094650. electronic book","kind":"ISBN"},{"value":"9781003019855. electronic book","kind":"ISBN"},{"value":"1003019854. 
electronic book","kind":"ISBN"},{"value":"paperback","kind":"ISBN"},{"value":"hardcover","kind":"ISBN"},{"value":"tayfra9781003019855","kind":"OCLC Number"},{"value":"(NhCcYBP)tayfra9781003019855","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://www.taylorfrancis.com/books/9781003019855","kind":"Digital object URL"},{"url":"https://www.taylorfrancis.com/books/9781003019855","kind":"Digital object URL","text":"Taylor & Francis Discovery Collection"}],"literary_form":"Nonfiction","locations":[{"value":"Florida","kind":"Place of Publication"},{"value":"Boca Raton, FL","kind":"Place of Publication"}],"notes":[{"value":["edited by Jay Liebowitz, Distinguished Chair of Applied Business and Finance, Harrisburg University of Science and Technology"],"kind":"Title Statement of Responsibility"},{"value":["\"An Auerbach Book\" -- taken from title page"],"kind":"General Note"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"},{"value":["Description based on online resource; title from digital title page (viewed on September 29, 2020)"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (xxiii, 242 pages) : illustrations (chiefly color).","publishers":[{"name":"CRC Press, Taylor & Francis Group","date":"2021","location":"Boca Raton, FL"},{"date":"©2021"}],"related_items":[{"description":"Data analytics applications","relationship":"In Series"}],"subjects":[{"value":["Statistics - Data processing"],"kind":"Topical Term"},{"value":["Artificial intelligence"],"kind":"Topical Term"},{"value":["Artificial Intelligence"],"kind":"Topical Term"}],"summary":["\"Two hot topics in recent years are data analytics and AI (artificial intelligence). These areas will continue to grow in importance for the foreseeable future. Unfortunately, both communities have not been communicating and collaborating with each other to build the necessary synergies. 
This book presents theory, applications, and case studies to bridge the gap between these fields\"--"],"timdex_provenance":{"source":"alma","run_date":"2026-02-07","run_id":"alma-daily-ingest-2026-02-07t09-21-29","run_record_offset":40606}},"sort":[31.500599,1609459200000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935044073106761","_score":31.500599,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935044073106761","timdex_record_id":"alma:9935044073106761","title":"Data Analytics in Sports","call_numbers":["GV716"],"citation":"Barlow, Janine (2015): Data Analytics in Sports. O'Reilly Media, Inc. Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935044073106761","content_type":["Language material"],"contributors":[{"value":"Barlow, Janine","kind":"author"}],"dates":[{"kind":"Publication date","value":"2015"}],"edition":"1st edition","holdings":[{"collection":"O'Reilly Online Learning: Academic/Public Library Edition","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53540434170006761&Force_direct=true"}],"identifiers":[{"value":"9781491927496","kind":"ISBN"},{"value":"1491927496","kind":"ISBN"},{"value":"(CKB)4920000000456960","kind":"OCLC Number"},{"value":"(CaSebORM)9781491927496","kind":"OCLC Number"},{"value":"1081175812","kind":"OCLC Number"},{"value":"on1081175812","kind":"OCLC Number"},{"value":"(EXLCZ)994920000000456960","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53540434170006761&Force_direct=true","kind":"Digital object URL","text":"O'Reilly Online Learning: Academic/Public Library Edition"}],"literary_form":"Fiction","locations":[{"value":"No place, unknown, or 
undetermined","kind":"Place of Publication"}],"notes":[{"value":["Barlow, Janine"],"kind":"Title Statement of Responsibility"},{"value":["Online resource; Title from title page (viewed September 15, 2015)"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (30 pages)","publishers":[{"name":"O'Reilly Media, Inc","date":"2015"}],"subjects":[{"value":["Sports - Data processing"],"kind":"Topical Term"},{"value":["Sports - Economic aspects"],"kind":"Topical Term"},{"value":["Big data"],"kind":"Topical Term"},{"value":["Information visualization"],"kind":"Topical Term"}],"summary":["As any child with a baseball card intuitively knows, sports and statistics go hand-in-hand. Yet, the general media disdain the flood of sports statistics available today: sports are pure and analytic tools are not. Well, if the so-called purists find tools like baseball’s sabermetrics upsetting, then they’d better brace themselves for the new wave of data analytics. In this O’Reilly report, Janine Barlow examines how advanced predictive analytics are impacting the world of sports—from the rise of tools such as Major League Baseball’s Statcast, which collects data on the movement of balls and players, to SportVU, which the National Basketball Association uses to collect spatial analysis data. 
You’ll also learn: How \"Dance Card\" makes accurate predictions about NCAA’s \"March Madness\" tournament Why data is crumbling long-standing myths about performance in soccer How the National Football League is using wearable devices to collect vital health data about its players It’s a new world in sports, where data analytics and related information technologies are changing the experience for teams, players, fans, and investors."],"timdex_provenance":{"source":"alma","run_date":"2025-02-28","run_id":"alma-full-ingest-2025-02-28t22-33-35","run_record_offset":75732}},"sort":[31.500599,1420070400000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935763825606761","_score":30.79974,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935763825606761","timdex_record_id":"alma:9935763825606761","title":"Data analytics and digital transformation","call_numbers":["HD30.2","004.0684"],"citation":"Beulen, Erik, Dans, Marla A (2024): Data analytics and digital transformation. London : Routledge, Taylor & Francis Group. Language material. 
https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935763825606761","content_type":["Language material"],"contents":["Cover","Endorsements Page","Half Title","Series Page","Title Page","Copyright Page","Table of Contents","List of Figures","List of Tables","About the Authors","Preface","Part 1 Business Context","1 Digital Transformations Explained","2 Data Analytics Trends Clarified","Part 2 Data Analytics Foundation","3 Data-Driven Decision-Making","4 Monetization of data and data Analytics","5 Data Quality - Data Management in Action","6 Data Governance - Business and IT Collaboration","7 Data Compliance, Privacy, and Ethics","Part 3 Digital Transformation Phase Powered by data Analytics","8 Digital 1.0 - Supplementing the Going Concern with Digital Initiatives","9 Digital 2.0 - Siloed Digital to Integrated Digital","10 Digital 3.0 - Preparing for Digital Transformation 2025","Part 4 Data Sharing-Centric Digital Transformations","11 Data Management and Governance Implications of data Sharing","12 Data Sharing - Competitive and Sustainability, Compliance, Privacy, and Ethical Implications","13 Partnering in Ecosystems - How to Structure Collaboration?","Part 5 Aligning at the Crossroads of data Analytics and Digital Transformations","14 Identifying good Practices and Roadmaps for Aligning Analytics and Digital Organizational Goals","15 2030 Perspective on Leveraging data Analytics in Achieving Digital Transformation Success","References","Index"],"contributors":[{"value":"Beulen, Erik","kind":"author"},{"value":"Dans, Marla A","kind":"author"}],"dates":[{"kind":"Publication date","value":"2024"}],"holdings":[{"collection":"Taylor & Francis eBooks Complete","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53703335250006761&Force_direct=true"}],"identifiers":[{"value":"9781003246770. 
(ebk)","kind":"ISBN"},{"value":"100324677X","kind":"ISBN"},{"value":"9781003807353. (ebook)","kind":"ISBN"},{"value":"1003807356","kind":"ISBN"},{"value":"9781003807315","kind":"ISBN"},{"value":"1003807313","kind":"ISBN"},{"value":"(MiAaPQ)EBC30767526","kind":"OCLC Number"},{"value":"(Au-PeEL)EBL30767526","kind":"OCLC Number"},{"value":"(CKB)28446180600041","kind":"OCLC Number"},{"value":"(EXLCZ)9928446180600041","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53703335250006761&Force_direct=true","kind":"Digital object URL","text":"Taylor & Francis eBooks Complete"}],"literary_form":"Nonfiction","locations":[{"value":"England","kind":"Place of Publication"},{"value":"London","kind":"Place of Publication"}],"notes":[{"value":["Erik Beulen and Marla A. Dans"],"kind":"Title Statement of Responsibility"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"},{"value":["Description based on print version record"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (257 pages) : illustrations","publishers":[{"name":"Routledge, Taylor & Francis Group","date":"2024","location":"London"},{"date":"©2024"}],"related_items":[{"description":"Business and digital transformation","relationship":"In Series"}],"subjects":[{"value":["Information technology - Management"],"kind":"Topical Term"},{"value":["Big data - Management"],"kind":"Topical Term"},{"value":["Management - Statistical methods"],"kind":"Topical Term"},{"value":["Strategic planning"],"kind":"Topical Term"}],"summary":["Understanding the significance of data analytics is paramount for digital transformation but in many organizations they are separate units without fully aligned goals. 
As organizations are applying digital transformations to be adaptive and agile in a competitive environment, data analytics can play a critical role in their success. This book explores the crossroads between them and how to leverage their connection for improved business outcomes. The need to collaborate and share data is becoming an integral part of digital transformation. This not only creates new opportunities but also requires well-considered and continuously assessed decision-making as competitiveness is at stake. This book details approaches, concepts, and frameworks, as well as actionable insights and good practices, including combined data management and agile concepts. Critical issues are discussed such as data quality and data governance, as well as compliance, privacy, and ethics. It also offers insights into how both private and public organizations can innovate and keep up with growing data volumes and increasing technological developments in the short, mid, and long term. This book will be of direct appeal to global researchers and students across a range of business disciplines, including technology and innovation management, organizational studies, and strategic management. It is also relevant for policy makers, regulators, and executives of private and public organizations looking to implement successful transformation policies."],"timdex_provenance":{"source":"alma","run_date":"2025-12-24","run_id":"alma-daily-ingest-2025-12-24t14-20-23","run_record_offset":4462}},"sort":[30.79974,1704067200000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935248399006761","_score":30.79974,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935248399006761","timdex_record_id":"alma:9935248399006761","title":"Data analytics using Python visualizations","call_numbers":["QA76.73.P98","005.133"],"citation":"Data analytics using Python visualizations. 2022. 
[Place of publication not identified] : Packt Publishing. Projected medium. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935248399006761","content_type":["Projected medium"],"contributors":[{"value":"Dasgupta, Manas","kind":"presenter"},{"value":"Packt Publishing","kind":"publisher"}],"dates":[{"kind":"Publication date","value":"2022"}],"edition":"[First edition].","holdings":[{"collection":"O'Reilly Online Learning: Academic/Public Library Edition","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53647178910006761&Force_direct=true"}],"identifiers":[{"value":"9781804614839","kind":"ISBN"},{"value":"1804614831","kind":"ISBN"},{"value":"(CKB)5590000000932030","kind":"OCLC Number"},{"value":"1334599801","kind":"OCLC Number"},{"value":"(OCoLC-P)1334599801","kind":"OCLC Number"},{"value":"(CaSebORM)9781804614839","kind":"OCLC Number"},{"value":"(EXLCZ)995590000000932030","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53647178910006761&Force_direct=true","kind":"Digital object URL","text":"O'Reilly Online Learning: Academic/Public Library Edition"}],"locations":[{"value":"No place, unknown, or undetermined","kind":"Place of Publication"},{"value":"[Place of publication not identified]","kind":"Place of Publication"}],"notes":[{"value":["\"Updated in June 2022.\""],"kind":"General Note"},{"value":["OCLC-licensed vendor bibliographic record"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (1 video file (6 hr., 28 min.)) : sound, color.","publishers":[{"name":"Packt Publishing","date":"[2022]","location":"[Place of publication not identified]"}],"subjects":[{"value":["Computer science"],"kind":"Topical Term"},{"value":["Python (Computer program 
language)"],"kind":"Topical Term"},{"value":["Electronic data processing"],"kind":"Topical Term"}],"summary":["Master data science, ML, and analytics with powerful visualizations using Matplotlib, Seaborn, and Bokeh. About This Video The art of presenting data in the form of powerful, innovative, and intuitive visualizations In-depth coverage of Matplotlib, Seaborn, and Bokeh visualization libraries Use of data analytics techniques/Exploratory Data Analysis (EDA) using several data generations and manipulation methods In Detail If you are working on machine learning projects and want to find patterns and insights from your data on your way to building models, then this course is for you. This course takes a holistic approach to teach visualization techniques. We will be taking real-life business scenarios and raw data to go through detailed Exploratory Data Analysis (EDA) techniques to prepare the raw data to suit the appropriate visualization needs. You will learn about data analytics and exploratory data analysis techniques using multiple different data structures with NumPy and Pandas libraries. You will also learn various chart/graph types, customization/configuration, and vectorization techniques. We will look at advanced visualizations using business applications such as single and multiple bar charts, pie charts, and bubble charts with the vectorization of properties. We will further explore Seaborn Boxplot, Violin plot, Categorical Scatterplot, and how to create heat maps. By the end of the course, you will learn the foundational techniques of data analytics and deeper customizations on visualizations. You will be able to confidently use Python visualization libraries such as Matplotlib, Seaborn, and Bokeh in your future projects.\\ Audience This course is for Python and machine learning developers, data scientists, data analysts, and business analysts. 
This course will also be beneficial to leaders, managers, and anyone whose job involves presenting data in the form of visuals, which include developers, architects, and system analysts. A basic understanding of Python will be helpful, but not mandatory."],"timdex_provenance":{"source":"alma","run_date":"2025-02-28","run_id":"alma-full-ingest-2025-02-28t22-33-35","run_record_offset":196493}},"sort":[30.79974,1640995200000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935444795806761","_score":30.79974,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935444795806761","timdex_record_id":"alma:9935444795806761","title":"Data analytics using Python visualizations","alternate_titles":[{"value":"Title on screen: Complete 2021 Python visualizations bootcamp","kind":"Varying Form of Title"}],"call_numbers":["QA76.73.P98","005.133"],"citation":"Dasgupta, Manas (Solutions architect) (2022): Data analytics using Python visualizations. Birmingham, England : PACKT Publishing. Projected medium. 
https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935444795806761","content_type":["Projected medium"],"contributors":[{"value":"Dasgupta, Manas (Solutions architect)","kind":"author"},{"value":"Dasgupta, Manas (Solutions architect)","kind":"instructor"},{"value":"Packt Publishing","kind":"production company"},{"value":"Packt Publishing","kind":"publisher"}],"dates":[{"kind":"Publication date","value":"2022"}],"edition":"[First edition].","holdings":[{"collection":"Academic Video Online (AVON)","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53660982330006761&Force_direct=true"}],"identifiers":[{"value":"(CKB)5590000001028878","kind":"OCLC Number"},{"value":"1334599801","kind":"OCLC Number"},{"value":"(VaAlASP)5373529","kind":"OCLC Number"},{"value":"(VaAlASP)ASP5373529/marc","kind":"OCLC Number"},{"value":"(OCoLC-P)1334599801","kind":"OCLC Number"},{"value":"(CaSebORM)9781804614839","kind":"OCLC Number"},{"value":"(EXLCZ)995590000001028878","kind":"OCLC Number"}],"languages":["English","In English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53660982330006761&Force_direct=true","kind":"Digital object URL","text":"Academic Video Online (AVON)"}],"locations":[{"value":"England","kind":"Place of Publication"},{"value":"Birmingham, England","kind":"Place of Publication"}],"notes":[{"value":["Manas Dasgupta"],"kind":"Title Statement of Responsibility"},{"value":["Title from resource description page (viewed March 13, 2023)"],"kind":"General Note"},{"value":["Manas Dasgupta, presenter"],"kind":"Participant or Performer Note"}],"physical_description":"1 online resource (387 minutes)","publishers":[{"name":"PACKT Publishing","date":"2022","location":"Birmingham, England"}],"subjects":[{"value":["Electronic data processing"],"kind":"Topical 
Term"},{"value":["Information visualization"],"kind":"Topical Term"},{"value":["Python (Computer program language)"],"kind":"Topical Term"},{"value":["Visual analytics"],"kind":"Topical Term"}],"summary":["f you are working on machine learning projects and want to find patterns and insights from your data on your way to building models, then this course is for you. This course takes a holistic approach to teach visualization techniques.  We will be taking real-life business scenarios and raw data to go through detailed Exploratory Data Analysis (EDA) techniques to prepare the raw data to suit the appropriate visualization needs. You will learn about data analytics and exploratory data analysis techniques using multiple different data structures with NumPy and Pandas libraries. You will also learn various chart/graph types, customization/configuration, and vectorization techniques.  We will look at advanced visualizations using business applications such as single and multiple bar charts, pie charts, and bubble charts with the vectorization of properties. We will further explore Seaborn Boxplot, Violin plot, Categorical Scatterplot, and how to create heat maps.  By the end of the course, you will learn the foundational techniques of data analytics and deeper customizations on visualizations. 
You will be able to confidently use Python visualization libraries such as Matplotlib, Seaborn, and Bokeh in your future projects."],"timdex_provenance":{"source":"alma","run_date":"2026-03-26","run_id":"alma-daily-ingest-2026-03-26t08-31-22","run_record_offset":6857}},"sort":[30.79974,1640995200000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935199842206761","_score":30.79974,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935199842206761","timdex_record_id":"alma:9935199842206761","title":"Data Analytics in Power Markets","call_numbers":["HD9685.A2","363.620212"],"citation":"Chen, Qixin (2021): Data Analytics in Power Markets. Singapore : Springer Nature Singapore :. Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935199842206761","content_type":["Language material"],"contents":["Introduction to power market data and their characteristics","Modeling load forecasting uncertainty using deep learning models","Data-driven load data cleaning and its impacts on forecasting performance","Generalized cost-oriented load forecasting in economic dispatch","A monthly electricity consumption forecasting method","Data-driven pattern extraction for analyzing market bidding behaviors","Stochastic optimal offering based on probabilistic forecast on aggregated supply curves","Power market simulation framework based on learning from individual offering strategy","Deep inverse reinforcement learning for reward function identification in bidding models","The subspace characteristics and congestion identification of LMP data","Online transmission topology identification in LMP-based markets","Day-ahead componential electricity price forecasting","Quantifying the impact of price forecasting error on market bidding","Virtual bidding and FTR speculation based on probabilistic LMP forecasting","Abnormal detection of LMP scenario and data 
with deep neural networks"],"contributors":[{"value":"Chen, Qixin","kind":"author"}],"dates":[{"kind":"Publication date","value":"2021"}],"edition":"1st ed. 2021.","holdings":[{"collection":"SpringerLink Books Energy","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53635138920006761&Force_direct=true"}],"identifiers":[{"value":"981-16-4975-8","kind":"ISBN"},{"value":"10.1007/978-981-16-4975-2. doi","kind":"Other Identifier"},{"value":"(CKB)5360000000049948","kind":"OCLC Number"},{"value":"(MiAaPQ)EBC6739146","kind":"OCLC Number"},{"value":"(Au-PeEL)EBL6739146","kind":"OCLC Number"},{"value":"1273475861","kind":"OCLC Number"},{"value":"(PPN)25830295X","kind":"OCLC Number"},{"value":"(DE-He213)978-981-16-4975-2","kind":"OCLC Number"},{"value":"(EXLCZ)995360000000049948","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53635138920006761&Force_direct=true","kind":"Digital object URL","text":"SpringerLink Books Energy"}],"literary_form":"Nonfiction","locations":[{"value":"Singapore","kind":"Place of Publication"}],"notes":[{"value":["by Qixin Chen, Hongye Guo, Kedi Zheng, Yi Wang"],"kind":"Title Statement of Responsibility"}],"physical_description":"1 online resource (291 pages)","publishers":[{"name":"Springer Nature Singapore :","date":"2021","location":"Singapore"}],"subjects":[{"value":["Energy policy"],"kind":"Topical Term"},{"value":["Machine learning"],"kind":"Topical Term"},{"value":["Electric power production"],"kind":"Topical Term"},{"value":["Power resources"],"kind":"Topical Term"},{"value":["Environmental economics"],"kind":"Topical Term"},{"value":["Energy Policy, Economics and Management"],"kind":"Topical Term"},{"value":["Machine Learning"],"kind":"Topical Term"},{"value":["Electrical Power Engineering"],"kind":"Topical 
Term"},{"value":["Resource and Environmental Economics"],"kind":"Topical Term"}],"summary":["This book aims to solve some key problems in the decision and optimization procedure for power market organizers and participants in data-driven approaches. It begins with an overview of the power market data and analyzes on their characteristics and importance for market clearing. Then, the first part of the book discusses the essential problem of bus load forecasting from the perspective of market organizers. The related works include load uncertainty modeling, bus load bad data correction, and monthly load forecasting. The following part of the book answers how much information can be obtained from public data in locational marginal price (LMP)-based markets. It introduces topics such as congestion identification, componential price forecasting, quantifying the impact of forecasting error, and financial transmission right investment. The final part of the book answers how to model the complex market bidding behaviors. Specific works include pattern extraction, aggregated supply curve forecasting, market simulation, and reward function identification in bidding. These methods are especially useful for market organizers to understand the bidding behaviors of market participants and make essential policies. 
It will benefit and inspire researchers, graduate students, and engineers in the related fields."],"timdex_provenance":{"source":"alma","run_date":"2025-11-07","run_id":"alma-daily-ingest-2025-11-07t09-25-08","run_record_offset":21881}},"sort":[30.79974,1609459200000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9936020869006761","_score":30.79974,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936020869006761","timdex_record_id":"alma:9936020869006761","title":"Data analytics in project management","call_numbers":["HD69.P75","658.4/040285"],"citation":"Data analytics in project management. 2019. Boca Raton, FL : CRC Press, Taylor and Francis Group. Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936020869006761","content_type":["Language material"],"contents":["Why data analytics in project management?","J. Davidson Frame and Yanping Chen","Data analytics risk : lost in translation?","Carl Pritchard","Analytical challenges of a modern PMO","Seweryn Spalek","Data analytics and project portfolio management","Alfonso Bucero","Earned value method","Werner Meyer","How to manage big data issues in a project environment","Ryan Legard","IT solutions of data analytics as applied to project management","Michael Bragen","Conventional and unconventional data mining for better decision-making","Klas Skogmar","Agile project management and data analytics","Deanne Larson","Data analytics and scrum","Bert Brijs"],"contributors":[{"value":"Spalek, Seweryn","kind":"editor"}],"dates":[{"kind":"Publication date","value":"2019"}],"holdings":[{"collection":"Taylor & Francis Discovery Collection","format":"electronic resource","location":"https://www.taylorfrancis.com/books/9780429434891"}],"identifiers":[{"value":"2020692569","kind":"LCCN"},{"value":"9780429786358. epub","kind":"ISBN"},{"value":"0429786352","kind":"ISBN"},{"value":"alk. 
paper","kind":"ISBN"},{"value":"9780429786365","kind":"ISBN"},{"value":"0429786360","kind":"ISBN"},{"value":"0429434898. (electronic bk.)","kind":"ISBN"},{"value":"9780429786341. (electronic bk. ;. Mobipocket)","kind":"ISBN"},{"value":"0429786344. (electronic bk. ;. Mobipocket)","kind":"ISBN"},{"value":"9780429434891. (electronic bk.)","kind":"ISBN"},{"value":"10.1201/9780429434891. doi","kind":"Other Identifier"},{"value":"tayfra9780429434891","kind":"OCLC Number"},{"value":"(NhCcYBP)tayfra9780429434891","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://www.taylorfrancis.com/books/9780429434891","kind":"Digital object URL"},{"url":"https://www.taylorfrancis.com/books/9780429434891","kind":"Digital object URL","text":"Taylor & Francis Discovery Collection"}],"literary_form":"Nonfiction","locations":[{"value":"Florida","kind":"Place of Publication"},{"value":"Boca Raton, FL","kind":"Place of Publication"}],"notes":[{"value":["edited by Seweryn Spalek"],"kind":"Title Statement of Responsibility"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"},{"value":["Description based on print version record"],"kind":"Source of Description Note"}],"physical_description":"1 online resource","publishers":[{"name":"CRC Press, Taylor and Francis Group","date":"[2019]","location":"Boca Raton, FL"}],"related_items":[{"description":"Data analytics applications","relationship":"In Series"}],"subjects":[{"value":["Project management - Data processing"],"kind":"Topical Term"},{"value":["Project management - Statistical methods"],"kind":"Topical Term"}],"summary":["This book aims to help the reader better understand the importance of data analysis in project management. Moreover, it provides guidance by showing tools, methods, techniques and lessons learned on how to better utilize the data gathered from the projects. 
First and foremost, insight into the bridge between data analytics and project management aids practitioners looking for ways to maximize the practical value of data procured. The book equips organizations with the know-how necessary to adapt to a changing workplace dynamic through key lessons learned from past ventures. The book's integrated approach to investigating both fields enhances the value of research findings."],"timdex_provenance":{"source":"alma","run_date":"2026-02-07","run_id":"alma-daily-ingest-2026-02-07t09-21-29","run_record_offset":60143}},"sort":[30.79974,1546300800000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9936021139106761","_score":30.79974,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936021139106761","timdex_record_id":"alma:9936021139106761","title":"Data analytics applications in education","call_numbers":["LB1028.43","370.285"],"citation":"Data analytics applications in education. 2018. Boca Raton, FL : CRC Press. Language material. 
https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936021139106761","content_type":["Language material"],"contents":["Big data analytics in a learning environment / Kristof De Witte and Jan Vanthienen","Improved student feedback with process and data analytics / Johannes De Smedt, Seppe vanden Broucke, Jan Vanthienen and Kristof De Witte","Towards data for development : a model on learning communities as a platform for growing data use / Wouter Schelfhout","The impact of fraudulent behavior on the usefulness of learning analytics applications : the case of question and answer sharing with medium-stakes online quizzing in higher education / Silvester Draaijer and Chris van Klaveren","Disentangling faculty efficiency from students' effort / Cristian Barra, Sergio Destefanis, Vania Sena and Roberto Zotti","Using data analytics to benchmark schools : the case of Portugal / Maria Conceição Portela and Ana S. Camanho","The use of educational data mining procedures to assess students' performance in a bayesian framework / Kristof De Witte, Grazia Graziosi and Joris Hindryckx","Using statistical analytics to study school performance through administrative datasets / Tommaso Agasisti, Francesca Ieva, Chiara Masci, Anna Maria Paganoni, and Mara Soncin","The governance of big data in higher education / Kurt De Wit and Bruno Broucker","Evidence based education and its implications for research and data analytics with an application to the overeducation literature / Wim Groot and Henriëtte Maassen van den Brink"],"contributors":[{"value":"Vanthienen, Jan","kind":"editor"},{"value":"Witte, K. 
de (Kristof)","kind":"editor"}],"dates":[{"kind":"Publication date","value":"2018"}],"holdings":[{"collection":"Taylor & Francis Discovery Collection","format":"electronic resource","location":"https://www.taylorfrancis.com/books/9781315154145"}],"identifiers":[{"value":"9781351650182 (electronic bk.)","kind":"ISBN"},{"value":"1351650181 (electronic bk.)","kind":"ISBN"},{"value":"tayfra9781315154145","kind":"OCLC Number"},{"value":"(NhCcYBP)tayfra9781315154145","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://www.taylorfrancis.com/books/9781315154145","kind":"Digital object URL"},{"url":"https://www.taylorfrancis.com/books/9781315154145","kind":"Digital object URL","text":"Taylor & Francis Discovery Collection"}],"literary_form":"Nonfiction","locations":[{"value":"Florida","kind":"Place of Publication"},{"value":"Boca Raton, FL","kind":"Place of Publication"}],"notes":[{"value":["edited by Jan Vanthienen and Kristof De Witte"],"kind":"Title Statement of Responsibility"},{"value":["Includes bibliographical references"],"kind":"Bibliography Note"},{"value":["Description based on print version record"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (pages cm.)","publishers":[{"name":"CRC Press","date":"2018","location":"Boca Raton, FL"}],"subjects":[{"value":["Education - Data processing"],"kind":"Topical Term"},{"value":["Educational statistics"],"kind":"Topical Term"},{"value":["Big data"],"kind":"Topical Term"}],"timdex_provenance":{"source":"alma","run_date":"2026-02-07","run_id":"alma-daily-ingest-2026-02-07t09-21-29","run_record_offset":64310}},"sort":[30.79974,1514764800000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935440988006761","_score":30.79974,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935440988006761","timdex_record_id":"alma:9935440988006761","title":"Data Analytics for Smart 
Cities","call_numbers":["TD159.4","307.760285"],"citation":"Data Analytics for Smart Cities. 2018. Milton : Auerbach Publications. Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935440988006761","content_type":["Language material"],"contents":["Smartphone technology integrated with machine learning for airport pavement condition assessment / Amir Alavi, William Buttlar","Global satellite observations for smart cities / Zhong Liu, Menglin S. Jin, Jacqueline Liu, Angela Li, William Teng, Bruce Vollmer, and D. Meyer","Advancing smart and resilient cities with big spatial disaster data : challenges, progresses, and opportunities / Xuan Hu and Jie Gong","Smart city portrayal : dynamic visualization applied to the analysis of underground metro / Evgheni Polisciuc and Penousal Machado","Smart bike-sharing systems for smart cities / Hesham A. Rakha","Indirect monitoring of critical transport infrastructure : data analytics and signal processing / Abdollah Malekjafarian","Big data exploration to examine aggressive driving behavior in the era of smart cities / Arash Jahangiri","Exploratory analysis of run-off-road crash patterns / Mohammad Jalayer","Predicting traffic safety risk factors using an ensemble classifier / Nasim Arbabzadeh","Architecture design of internet of things-enabled cloud platform for managing the production of prefabricated public houses / Clyde Zhengdao Li"],"contributors":[{"value":"Alavi, Amir","kind":"Not specified"},{"value":"Buttlar, William G","kind":"Not specified"}],"dates":[{"kind":"Publication date","value":"2018"}],"edition":"1st ed.","holdings":[{"collection":"Taylor & Francis eBooks Complete","format":"electronic 
resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53660230530006761&Force_direct=true"}],"identifiers":[{"value":"0-429-43498-7","kind":"ISBN"},{"value":"0-429-78662-X","kind":"ISBN"},{"value":"0-429-78663-8","kind":"ISBN"},{"value":"(CKB)4100000007121405","kind":"OCLC Number"},{"value":"(MiAaPQ)EBC5566778","kind":"OCLC Number"},{"value":"1061098835","kind":"OCLC Number"},{"value":"(OCoLC-P)1061098835","kind":"OCLC Number"},{"value":"(FlBoTFG)9780429434983","kind":"OCLC Number"},{"value":"(EXLCZ)994100000007121405","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53660230530006761&Force_direct=true","kind":"Digital object URL","text":"Taylor & Francis eBooks Complete"}],"literary_form":"Nonfiction","locations":[{"value":"No place, unknown, or undetermined","kind":"Place of Publication"},{"value":"Milton","kind":"Place of Publication"}],"notes":[{"value":["edited by Amir H. Alavi, William G. Buttlar"],"kind":"Title Statement of Responsibility"},{"value":["4.3.2 Color-Coding"],"kind":"General Note"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"},{"value":["Description based on print version record"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (255 pages) : illustrations (some color).","publishers":[{"name":"Auerbach Publications","date":"2018","location":"Milton"}],"related_items":[{"description":"Data analytics applications","relationship":"In Series"}],"subjects":[{"value":["Smart cities"],"kind":"Topical Term"},{"value":["Big data"],"kind":"Topical Term"},{"value":["Quantitative research"],"kind":"Topical Term"}],"summary":["The development of smart cities is one of the most important challenges over the next few decades. 
Governments and companies are leveraging billions of dollars in public and private funds for smart cities. Next generation smart cities are heavily dependent on distributed smart sensing systems and devices to monitor the urban infrastructure. The smart sensor networks serve as autonomous intelligent nodes to measure a variety of physical or environmental parameters. They should react in time, establish automated control, and collect information for intelligent decision-making. In this context, one of the major tasks is to develop advanced frameworks for the interpretation of the huge amount of information provided by the emerging testing and monitoring systems. Data Analytics for Smart Cities brings together some of the most exciting new developments in the area of integrating advanced data analytics systems into smart cities along with complementary technological paradigms such as cloud computing and Internet of Things (IoT). The book serves as a reference for researchers and engineers in domains of advanced computation, optimization, and data mining for smart civil infrastructure condition assessment, dynamic visualization, intelligent transportation systems (ITS), cyber-physical systems, and smart construction technologies. The chapters are presented in a hands-on manner to facilitate researchers in tackling applications. Arguably, data analytics technologies play a key role in tackling the challenge of creating smart cities. Data analytics applications involve collecting, integrating, and preparing time- and space-dependent data produced by sensors, complex engineered systems, and physical assets, followed by developing and testing analytical models to verify the accuracy of results. This book covers this multidisciplinary field and examines multiple paradigms such as machine learning, pattern recognition, statistics, intelligent databases, knowledge acquisition, data visualization, high performance computing, and expert systems. 
The book explores new territory by discussing the cutting-edge concept of Big Data analytics for interpreting massive amounts of data in smart city applications."],"timdex_provenance":{"source":"alma","run_date":"2025-12-24","run_id":"alma-daily-ingest-2025-12-24t14-20-23","run_record_offset":1734}},"sort":[30.79974,1514764800000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9936022186606761","_score":30.79974,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936022186606761","timdex_record_id":"alma:9936022186606761","title":"Data analytics for internal auditors","call_numbers":["HF5668","657/.458"],"citation":"Cascarino, Richard (2017): Data analytics for internal auditors. Boca Raton : CRC Press, Taylor & Francis Group. Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9936022186606761","content_type":["Language material"],"contents":["Chapter 1. Introduction to data analysis","chapter 2. Understanding sampling","chapter 3. Judgmental versus statistical sampling","chapter 4. Probability theory in data analysis","chapter 5. Types of evidence","chapter 6. Population analysis","chapter 7. Correlations, regressions, and other analyses","chapter 8. Conducting the audit","chapter 9. Obtaining information from IT systems for analysis","chapter 10. Use of computer-assisted audit techniques","chapter 11. Analysis of big data","chapter 12. Results analysis and validation","chapter 13. Fraud detection using data analysis","chapter 14. Root cause analysis","chapter 15. Data analysis and continuous monitoring","chapter 16. Continous auditing","chapter 17. Financial analysis","chapter 18. Excel and data analysis","chapter 19. ACL and data analysis","chapter 20. IDEA and data analysis","chapter 21. SAS and data analysis","chapter 22. Analysis reporting","chapter 23. Data visualization and presentation","chapte 24. 
Conclusion"],"contributors":[{"value":"Cascarino, Richard","kind":"author"}],"dates":[{"kind":"Publication date","value":"2017"}],"holdings":[{"collection":"Taylor & Francis Discovery Collection","format":"electronic resource","location":"https://www.taylorfrancis.com/books/9781315369532"}],"identifiers":[{"value":"9781498737159. (electronic bk.)","kind":"ISBN"},{"value":"1498737153. (electronic bk.)","kind":"ISBN"},{"value":"9781315369532. (electronic bk.)","kind":"ISBN"},{"value":"1315369532. (electronic bk.)","kind":"ISBN"},{"value":"tayfra9781315369532","kind":"OCLC Number"},{"value":"(NhCcYBP)tayfra9781315369532","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://www.taylorfrancis.com/books/9781315369532","kind":"Digital object URL"},{"url":"https://www.taylorfrancis.com/books/9781315369532","kind":"Digital object URL","text":"Taylor & Francis Discovery Collection"}],"literary_form":"Nonfiction","locations":[{"value":"Florida","kind":"Place of Publication"},{"value":"Boca Raton","kind":"Place of Publication"}],"notes":[{"value":["Richard E. 
Cascarino"],"kind":"Title Statement of Responsibility"},{"value":["\"An Auerbach book.\""],"kind":"General Note"},{"value":["Includes bibliographical references and index"],"kind":"Bibliography Note"},{"value":["Online resource; title from PDF title page (EBSCO, viewed March 23, 2017)"],"kind":"Source of Description Note"}],"physical_description":"1 online resource : illustrations","publishers":[{"name":"CRC Press, Taylor & Francis Group","date":"[2017]","location":"Boca Raton"},{"date":"©20"},{"date":"©2017"}],"related_items":[{"description":"Internal audit and IT audit","relationship":"In Series"}],"subjects":[{"value":["Auditing, Internal"],"kind":"Topical Term"},{"value":["Electronic data processing - Auditing"],"kind":"Topical Term"}],"summary":["Providing a reference guide for IT and Internal Auditors as well as Fraud Examiners, this book presents information written from the practitioner's viewpoint covering not only the need and the theory, but a practical hands-on approach to conducting data analytics. --"],"timdex_provenance":{"source":"alma","run_date":"2026-02-07","run_id":"alma-daily-ingest-2026-02-07t09-21-29","run_record_offset":39970}},"sort":[30.79974,1483228800000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935113615206761","_score":30.79974,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935113615206761","timdex_record_id":"alma:9935113615206761","title":"Data Analytics for Protein Crystallization","call_numbers":["QH506","572.8"],"citation":"Pusey, Marc L, Aygün, Ramazan Savaş (2017): Data Analytics for Protein Crystallization. Cham : Springer International Publishing :. Language material. 
https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935113615206761","content_type":["Language material"],"contents":["Introduction to Protein Crystallization","Scoring and Phases of Crystallization","Computational Methods for Protein Crystallization Screening","Robotic Image Acquisition","Classification of Crystallization Trial Images","Crystal Growth Analysis","Focal Stacking for Crystallization Microscopy","Crystal Image Region Segmentation","Visualization","Other Structure Determination Methods","Future of Computational Protein Crystallization"],"contributors":[{"value":"Pusey, Marc L","kind":"author"},{"value":"Aygün, Ramazan Savaş","kind":"author"}],"dates":[{"kind":"Publication date","value":"2017"}],"edition":"1st ed. 2017.","holdings":[{"collection":"Springer Nature - Springer Computer Science eBooks 2017 English International","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53690428910006761&Force_direct=true"}],"identifiers":[{"value":"3-319-58937-7","kind":"ISBN"},{"value":"10.1007/978-3-319-58937-4. doi","kind":"Other Identifier"},{"value":"(CKB)4340000000223226","kind":"OCLC Number"},{"value":"(DE-He213)978-3-319-58937-4","kind":"OCLC Number"},{"value":"(MiAaPQ)EBC5163202","kind":"OCLC Number"},{"value":"(PPN)221252045","kind":"OCLC Number"},{"value":"(EXLCZ)994340000000223226","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53690428910006761&Force_direct=true","kind":"Digital object URL","text":"Springer Nature - Springer Computer Science eBooks 2017 English International"}],"literary_form":"Nonfiction","locations":[{"value":"Germany","kind":"Place of Publication"},{"value":"Cham","kind":"Place of Publication"}],"notes":[{"value":["by Marc L. 
Pusey, Ramazan Savaş Aygün"],"kind":"Title Statement of Responsibility"},{"value":["Includes bibliographical references at the end of each chapters and index"],"kind":"Bibliography Note"}],"physical_description":"1 online resource (XX, 231 p. 66 illus., 56 illus. in color.) ","publishers":[{"name":"Springer International Publishing :","date":"2017","location":"Cham"}],"related_items":[{"description":"Computational Biology, 1568-2684 ; 25","relationship":"In Series"}],"subjects":[{"value":["Bioinformatics"],"kind":"Topical Term"},{"value":["Data mining"],"kind":"Topical Term"},{"value":["Optical data processing"],"kind":"Topical Term"},{"value":["Molecular biology"],"kind":"Topical Term"},{"value":["Biotechnology"],"kind":"Topical Term"},{"value":["Computational Biology/Bioinformatics"],"kind":"Topical Term"},{"value":["Data Mining and Knowledge Discovery"],"kind":"Topical Term"},{"value":["Image Processing and Computer Vision"],"kind":"Topical Term"},{"value":["Molecular Medicine"],"kind":"Topical Term"}],"summary":["This unique text/reference presents an overview of the computational aspects of protein crystallization, describing how to build robotic high-throughput and crystallization analysis systems. The coverage encompasses the complete data analysis cycle, including the set-up of screens by analyzing prior crystallization trials, the classification of crystallization trial images by effective feature extraction, the analysis of crystal growth in time series images, the segmentation of crystal regions in images, the application of focal stacking methods for crystallization images, and the visualization of trials. 
Topics and features: Describes the fundamentals of protein crystallization, and the scoring and categorization of crystallization image trials Introduces a selection of computational methods for protein crystallization screening, and the hardware and software architecture for a basic high-throughput system Presents an overview of the image features used in protein crystallization classification, and a spatio-temporal analysis of protein crystal growth Examines focal stacking techniques to avoid blurred crystallization images, and different thresholding methods for binarization or segmentation Discusses visualization methods and software for protein crystallization analysis, and reviews alternative methods to X-ray diffraction for obtaining structural information Provides an overview of the current challenges and potential future trends in protein crystallization This interdisciplinary work serves as an essential reference on the computational and data analytics components of protein crystallization for the structural biology community, in addition to computer scientists wishing to enter the field of protein crystallization. Dr. Marc L. Pusey is a Research Scientist at iXpressGenes, Inc. Huntsville, AL, USA. Dr. Ramazan Savaş Aygün is an Associate Professor in the Computer Science Department of the University of Alabama in Huntsville, USA."],"timdex_provenance":{"source":"alma","run_date":"2025-02-28","run_id":"alma-full-ingest-2025-02-28t22-33-35","run_record_offset":188688}},"sort":[30.79974,1483228800000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935092392506761","_score":30.79974,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935092392506761","timdex_record_id":"alma:9935092392506761","title":"Data Analytics in Digital Humanities","call_numbers":["QA75.5-76.95","005.7"],"citation":"Data Analytics in Digital Humanities. 2017. Cham : Springer International Publishing :. 
Language material. https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935092392506761","content_type":["Language material"],"contents":["Semantic Web for Cultural Heritage Valorization","Using the Formal Representations of Elementary Events to Set Up Computational Models of Full Narratives","Parody Detection: An Annotation, Feature Construction, and Classification Approach to the Web of Parody","Creating and Analyzing Literary Corpora","Content and Sentiment Analysis on Online Social Networks (OSNs)","The Role of Data in Evaluating the Effectiveness of Networked Learning: An Auto-Ethnographic Evaluation of Four Experiential Learning Projects","Psychological Text Analysis in the Digital Humanities","Parsing Related Tags Networks from Flickr to Explore Crowd-Sourced Keyword Associations","A Case Study of Crowdsourcing Imagery Coding in Natural Disasters","YouTube Comments as Metalanguage Data on Non-standard Languages: The Case of Trinidadian Creole English in Soca Music","Creating Inheritable Digital Codebooks for Qualitative Research Data Analysis","Is it Worth It? The Library and Information Science Degree in the Digital Humanities"],"contributors":[{"value":"Hai-Jew, Shalin","kind":"editor"}],"dates":[{"kind":"Publication date","value":"2017"}],"edition":"1st ed. 2017.","holdings":[{"collection":"Springer Nature - Springer Computer Science eBooks 2017 English International","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53690453500006761&Force_direct=true"}],"identifiers":[{"value":"3-319-54499-3","kind":"ISBN"},{"value":"10.1007/978-3-319-54499-1. 
doi","kind":"Other Identifier"},{"value":"(CKB)3710000001307197","kind":"OCLC Number"},{"value":"(DE-He213)978-3-319-54499-1","kind":"OCLC Number"},{"value":"(MiAaPQ)EBC4854498","kind":"OCLC Number"},{"value":"(PPN)20147218X","kind":"OCLC Number"},{"value":"(EXLCZ)993710000001307197","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53690453500006761&Force_direct=true","kind":"Digital object URL","text":"Springer Nature - Springer Computer Science eBooks 2017 English International"}],"literary_form":"Nonfiction","locations":[{"value":"Germany","kind":"Place of Publication"},{"value":"Cham","kind":"Place of Publication"}],"notes":[{"value":["edited by Shalin Hai-Jew"],"kind":"Title Statement of Responsibility"},{"value":["Includes bibliographical references at the end of each chapters"],"kind":"Bibliography Note"}],"physical_description":"1 online resource (XXII, 295 p. 37 illus., 23 illus. in color.) ","publishers":[{"name":"Springer International Publishing :","date":"2017","location":"Cham"}],"related_items":[{"description":"Multimedia Systems and Applications","relationship":"In Series"}],"subjects":[{"value":["Computers"],"kind":"Topical Term"},{"value":["Application software"],"kind":"Topical Term"},{"value":["Computer networks"],"kind":"Topical Term"},{"value":["Artificial intelligence"],"kind":"Topical Term"},{"value":["Information Systems and Communication Service"],"kind":"Topical Term"},{"value":["Computer Appl. in Arts and Humanities"],"kind":"Topical Term"},{"value":["Computer Communication Networks"],"kind":"Topical Term"},{"value":["Artificial Intelligence"],"kind":"Topical Term"}],"summary":["This book covers computationally innovative methods and technologies including data collection and elicitation, data processing, data analysis, data visualizations, and data presentation. 
It explores how digital humanists have harnessed the hypersociality and social technologies, benefited from the open-source sharing not only of data but of code, and made technological capabilities a critical part of humanities work. Chapters are written by researchers from around the world, bringing perspectives from diverse fields and subject areas. The respective authors describe their work, their research, and their learning. Topics include semantic web for cultural heritage valorization, machine learning for parody detection by classification, psychological text analysis, crowdsourcing imagery coding in natural disasters, and creating inheritable digital codebooks. Designed for researchers and academics, this book is suitable for those interested in methodologies and analytics that can be applied in literature, history, philosophy, linguistics, and related disciplines. Professionals such as librarians, archivists, and historians will also find the content informative and instructive. ."],"timdex_provenance":{"source":"alma","run_date":"2025-12-25","run_id":"alma-daily-ingest-2025-12-25t15-32-27","run_record_offset":5110}},"sort":[30.79974,1483228800000]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935985489406761","_score":30.79974,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935985489406761","timdex_record_id":"alma:9935985489406761","title":"Data Analytics and Applied Mathematics","citation":"Data Analytics and Applied Mathematics. Malaysia : Universiti Malaysia Pahang Publishing. Language material. 
https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935985489406761","content_type":["Language material"],"holdings":[{"collection":"DOAJ Directory of Open Access Journals","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53734187800006761&Force_direct=true","note":"Available from 2020 until 2025."}],"identifiers":[{"value":"2773-4854","kind":"ISSN"},{"value":"(CKB)42026147200041","kind":"OCLC Number"},{"value":"(EXLCZ)9942026147200041","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53734187800006761&Force_direct=true","kind":"Digital object URL","text":"DOAJ Directory of Open Access Journals"}],"locations":[{"value":"No place, unknown, or undetermined","kind":"Place of Publication"},{"value":"Malaysia","kind":"Place of Publication"}],"publishers":[{"name":"Universiti Malaysia Pahang Publishing","location":"Malaysia"}],"timdex_provenance":{"source":"alma","run_date":"2026-01-04","run_id":"alma-daily-ingest-2026-01-04t09-29-06","run_record_offset":8313}},"sort":[30.79974,-9223372036854775808]},{"_index":"alma-2025-03-01t03-00-02","_id":"alma:9935705173306761","_score":30.580158,"_source":{"source":"MIT Alma","source_link":"https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935705173306761","timdex_record_id":"alma:9935705173306761","title":"Data Analytics and Machine Learning : Navigating the Big Data Landscape","call_numbers":["QA76.9.Q36","001.422","005.7"],"citation":"Data Analytics and Machine Learning : Navigating the Big Data Landscape. 2024. Singapore : Springer Nature Singapore :. Language material. 
https://mit.primo.exlibrisgroup.com/discovery/fulldisplay?vid=01MIT_INST:MIT&docid=alma9935705173306761","content_type":["Language material"],"contents":["Chapter 1. Introduction to Data Analytics, Big Data, and Machine Learning","Chapter 2. Fundamentals of Data Analytics and Lifecycle","Chapter 3. Building Predictive Models with Machine Learning","Chapter 4. Stream data model and architecture","Chapter 5. Leveraging Big Data for Data Analytics","Chapter 6. Advanced Techniques in Data Analytics","Chapter 7. Scalable Machine Learning with Big Data","Chapter 8. Big Data Analytics Framework using Machine Learning on Massive Datasets","Chapter 9. Deep-learning Techniques in Big-Data analytics","Chapter 10. Data Privacy and Ethics in Data Analytics","Chapter 11. Practical Implementation of Machine Learning Techniques & data analytics using R","Chapter 12. Real-World Applications of Data Analytics, Big Data, and Machine Learning","Chapter 13. Implementing Data-Driven Innovation in Organizations","Chapter 14. Business Transformation using Big Data Analytics and Machine Learning","Chapter 15. Future Trends and Emerging Opportunities in HealthAnalytics","Chapter 16. Future Trends in Data Analytics and Machine Learning"],"contributors":[{"value":"Singh, Pushpa","kind":"Not specified"},{"value":"Mishra, Asha Rani","kind":"Not specified"},{"value":"Garg, Payal","kind":"Not specified"}],"dates":[{"kind":"Publication date","value":"2024"}],"edition":"1st ed. 2024.","holdings":[{"collection":"SpringerLink Books Mathematics and Statistics","format":"electronic resource","location":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53692170200006761&Force_direct=true"}],"identifiers":[{"value":"9789819704484","kind":"ISBN"},{"value":"9819704480","kind":"ISBN"},{"value":"10.1007/978-981-97-0448-4. 
doi","kind":"Other Identifier"},{"value":"(MiAaPQ)EBC31221972","kind":"OCLC Number"},{"value":"(Au-PeEL)EBL31221972","kind":"OCLC Number"},{"value":"(DE-He213)978-981-97-0448-4","kind":"OCLC Number"},{"value":"(CKB)30995669800041","kind":"OCLC Number"},{"value":"1427666886","kind":"OCLC Number"},{"value":"(EXLCZ)9930995669800041","kind":"OCLC Number"}],"languages":["English"],"links":[{"url":"https://na06.alma.exlibrisgroup.com/view/uresolver/01MIT_INST/openurl?u.ignore_date_coverage=true&portfolio_pid=53692170200006761&Force_direct=true","kind":"Digital object URL","text":"SpringerLink Books Mathematics and Statistics"}],"literary_form":"Nonfiction","locations":[{"value":"Singapore","kind":"Place of Publication"}],"notes":[{"value":["edited by Pushpa Singh, Asha Rani Mishra, Payal Garg"],"kind":"Title Statement of Responsibility"},{"value":["Description based on publisher supplied metadata and other sources"],"kind":"Source of Description Note"}],"physical_description":"1 online resource (357 pages)","publishers":[{"name":"Springer Nature Singapore :","date":"2024","location":"Singapore"}],"related_items":[{"description":"Studies in Big Data, 2197-6511 ; 145","relationship":"In Series"}],"subjects":[{"value":["Quantitative research"],"kind":"Topical Term"},{"value":["Machine learning"],"kind":"Topical Term"},{"value":["Natural language processing (Computer science)"],"kind":"Topical Term"},{"value":["Data Analysis and Big Data"],"kind":"Topical Term"},{"value":["Machine Learning"],"kind":"Topical Term"},{"value":["Natural Language Processing (NLP)"],"kind":"Topical Term"},{"value":["Dades massives"],"kind":"Topical Term"},{"value":["Aprenentatge automàtic"],"kind":"Topical Term"}],"summary":["This book presents an in-depth analysis of successful data-driven initiatives, highlighting how organizations have leveraged data to drive decision-making processes, optimize operations, and achieve remarkable outcomes. 
Through case studies, readers gain valuable insights and learn practical strategies for implementing data analytics, big data, and machine learning solutions in their own organizations. The book discusses the transformative power of data analytics and big data in various industries and sectors and how machine learning applications have revolutionized exploration by enabling advanced data analysis techniques for mapping, geospatial analysis, and environmental monitoring, enhancing our understanding of the world and its dynamic processes. This book explores how big data explosion, the power of analytics and machine learning revolution can bring new prospects and opportunities in the dynamic and data-rich landscape. It highlights the future research directions in data analytics, big data, and machine learning that explores the emerging trends, challenges, and opportunities in these fields by covering interdisciplinary approaches such as handling and analyzing real-time and streaming data."],"timdex_provenance":{"source":"alma","run_date":"2026-02-24","run_id":"alma-daily-ingest-2026-02-24t09-21-06","run_record_offset":2713}},"sort":[30.580158,1704067200000]}]},"aggregations":{"places":{"doc_count":1780947,"only_spatial":{"doc_count":147572,"place_names":{"doc_count_error_upper_bound":536,"sum_other_doc_count":126725,"buckets":[{"key":"arctic ocean","doc_count":3374},{"key":"europe","doc_count":3116},{"key":"united states","doc_count":2671},{"key":"massachusetts","doc_count":2390},{"key":"new jersey","doc_count":2083},{"key":"canada","doc_count":1674},{"key":"china","doc_count":1664},{"key":"earth (planet)","doc_count":1452},{"key":"california","doc_count":1346},{"key":"wisconsin","doc_count":1077}]}}},"languages":{"doc_count_error_upper_bound":36,"sum_other_doc_count":6273,"buckets":[{"key":"english","doc_count":282244},{"key":"eng","doc_count":19186},{"key":"en_us","doc_count":10075},{"key":"en","doc_count":7809},{"key":"in 
english","doc_count":3171},{"key":"german","doc_count":1698},{"key":"french","doc_count":978},{"key":"fra","doc_count":947},{"key":"spanish","doc_count":898},{"key":"russian","doc_count":772}]},"content_type":{"doc_count_error_upper_bound":1,"sum_other_doc_count":15843,"buckets":[{"key":"language material","doc_count":228382},{"key":"polygon data","doc_count":28600},{"key":"article","doc_count":15068},{"key":"image data","doc_count":13247},{"key":"raster data","doc_count":11629},{"key":"thesis","doc_count":11565},{"key":"manuscript language material","doc_count":9646},{"key":"line data","doc_count":8771},{"key":"point data","doc_count":8135},{"key":"not specified","doc_count":5574}]},"subjects":{"doc_count":1780947,"subject_names":{"doc_count_error_upper_bound":6711,"sum_other_doc_count":1598402,"buckets":[{"key":"datasets","doc_count":53692},{"key":"boundaries","doc_count":26136},{"key":"artificial intelligence","doc_count":24242},{"key":"other","doc_count":21480},{"key":"transportation","doc_count":19587},{"key":"society","doc_count":15058},{"key":"united states","doc_count":10086},{"key":"computer networks","doc_count":9451},{"key":"computational intelligence","doc_count":9229},{"key":"oceans","doc_count":9100}]}},"content_format":{"doc_count_error_upper_bound":0,"sum_other_doc_count":173,"buckets":[{"key":"shapefile","doc_count":45170},{"key":"electronic resource","doc_count":34697},{"key":"geotiff","doc_count":14161},{"key":"tiff","doc_count":11827},{"key":"mixed","doc_count":831},{"key":"jpeg","doc_count":340},{"key":"arcgrid","doc_count":266},{"key":"pdf","doc_count":225},{"key":"las","doc_count":148},{"key":"laz","doc_count":103}]},"literary_form":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[{"key":"nonfiction","doc_count":219030},{"key":"fiction","doc_count":13709}]},"source":{"doc_count_error_upper_bound":0,"sum_other_doc_count":55,"buckets":[{"key":"mit alma","doc_count":245721},{"key":"opengeometadata gis 
resources","doc_count":73620},{"key":"dspace@mit","doc_count":29210},{"key":"woods hole open access server","doc_count":2994},{"key":"mit gis resources","doc_count":2029},{"key":"zenodo","doc_count":2013},{"key":"mit libraries website","doc_count":225},{"key":"abdul latif jameel poverty action lab dataverse","doc_count":107},{"key":"mit archivesspace","doc_count":105},{"key":"research databases","doc_count":93}]},"contributors":{"doc_count":1236194,"contributor_names":{"doc_count_error_upper_bound":2058,"sum_other_doc_count":1186776,"buckets":[{"key":"national bureau of economic research","doc_count":12657},{"key":"massachusetts institute of technology. department of electrical engineering and computer science","doc_count":6826},{"key":"institute of electrical and electronics engineers","doc_count":4459},{"key":"boundary solutions, inc.","doc_count":4081},{"key":"geological survey (u.s.)","doc_count":4077},{"key":"collins bartholomew ltd","doc_count":3653},{"key":"massachusetts institute of technology. department of physics","doc_count":3589},{"key":"u.s. 
department of commerce, bureau of the census, geography division","doc_count":3530},{"key":"arctic climate system (acsys)","doc_count":3349},{"key":"international monetary fund","doc_count":3197}]}},"access_to_files":{"doc_count":189972,"only_file_access":{"doc_count":75649,"access_types":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[{"key":"unknown: check with owning institution","doc_count":73620},{"key":"MIT authentication required","doc_count":1198},{"key":"no authentication required","doc_count":831}]}}}}} + recorded_at: Tue, 28 Apr 2026 20:49:13 GMT +recorded_with: VCR 6.4.0 diff --git a/test/vcr_cassettes/graphql_search_data_analytics_semantic.yml b/test/vcr_cassettes/graphql_search_data_analytics_semantic.yml new file mode 100644 index 00000000..09e7511a --- /dev/null +++ b/test/vcr_cassettes/graphql_search_data_analytics_semantic.yml @@ -0,0 +1,107 @@ +--- +http_interactions: +- request: + method: post + uri: http://localhost:9200/2015-03-31/functions/timdex-semantic-builder-prod:live/invocations + body: + encoding: UTF-8 + string: '{"query":"data analytics"}' + headers: + Accept-Encoding: + - '' + Amz-Sdk-Invocation-Id: + - 4a482ef1-b42f-4ba5-83c0-05202d742cb7 + X-Amz-Invocation-Type: + - RequestResponse + Content-Type: + - application/octet-stream + Host: + - localhost:9200 + X-Amz-Date: + - 20260430T224737Z + X-Amz-Content-Sha256: + - "" + Authorization: + - "" + User-Agent: + - aws-sdk-ruby3/3.244.0 ua/2.1 api/lambda#1.177.0 os/macos#25 md/arm64 lang/ruby#3.4.9 + md/3.4.9 m/Z,b,D,n + Content-Length: + - '26' + Accept: + - "*/*" + response: + status: + code: 200 + message: OK + headers: + Date: + - Thu, 30 Apr 2026 22:47:37 GMT + Content-Type: + - application/json + Content-Length: + - '360' + Connection: + - keep-alive + X-Amzn-Requestid: + - 0bc77ad7-4cfb-4942-b62e-f149ba06f32c + X-Amzn-Remapped-Content-Length: + - '0' + X-Amz-Executed-Version: + - '2' + X-Amzn-Trace-Id: + - 
Root=1-69f3dc09-64c77dfd369f5871491a1d56;Parent=27260d29f18ac71f;Sampled=0;Lineage=1:75f47734:0 + body: + encoding: UTF-8 + string: '{"query": {"bool": {"should": [{"rank_feature": {"field": "embedding_full_record.[CLS]", + "boost": 1.0}}, {"rank_feature": {"field": "embedding_full_record.[SEP]", + "boost": 1.0}}, {"rank_feature": {"field": "embedding_full_record.data", "boost": + 3.960404872894287}}, {"rank_feature": {"field": "embedding_full_record.analytics", + "boost": 7.998181343078613}}]}}}' + recorded_at: Thu, 30 Apr 2026 22:47:37 GMT +- request: + method: post + uri: http://localhost:9200/all-current/_search + body: + encoding: UTF-8 + string: '{"from":"0","size":20,"query":{"bool":{"should":[{"rank_feature":{"field":"embedding_full_record.[CLS]","boost":1.0}},{"rank_feature":{"field":"embedding_full_record.[SEP]","boost":1.0}},{"rank_feature":{"field":"embedding_full_record.data","boost":3.960404872894287}},{"rank_feature":{"field":"embedding_full_record.analytics","boost":7.998181343078613}}]}},"aggregations":{"access_to_files":{"nested":{"path":"rights"},"aggs":{"only_file_access":{"filter":{"terms":{"rights.kind":["Access + to files"]}},"aggs":{"access_types":{"terms":{"field":"rights.description.keyword"}}}}}},"contributors":{"nested":{"path":"contributors"},"aggs":{"contributor_names":{"terms":{"field":"contributors.value.keyword"}}}},"content_type":{"terms":{"field":"content_type"}},"content_format":{"terms":{"field":"format"}},"languages":{"terms":{"field":"languages.keyword"}},"literary_form":{"terms":{"field":"literary_form"}},"places":{"nested":{"path":"subjects"},"aggs":{"only_spatial":{"filter":{"terms":{"subjects.kind":["Dublin + Core; 
Spatial"]}},"aggs":{"place_names":{"terms":{"field":"subjects.value.keyword"}}}}}},"source":{"terms":{"field":"source"}},"subjects":{"nested":{"path":"subjects"},"aggs":{"subject_names":{"terms":{"field":"subjects.value.keyword"}}}}},"sort":[{"_score":{"order":"desc"}},{"dates.value.as_date":{"order":"desc","nested":{"path":"dates"}}}]}' + headers: + User-Agent: + - 'opensearch-ruby/3.4.0 (RUBY_VERSION: 3.4.9; darwin arm64; Faraday v2.14.0)' + Content-Type: + - application/json + Host: + - localhost:9200 + X-Amz-Date: + - 20260430T224737Z + X-Amz-Content-Sha256: + - "" + Authorization: + - "" + Accept-Encoding: + - gzip;q=1.0,deflate;q=0.6,identity;q=0.3 + Accept: + - "*/*" + response: + status: + code: 200 + message: OK + headers: + Date: + - Thu, 30 Apr 2026 22:47:38 GMT + Content-Type: + - application/json; charset=UTF-8 + Content-Length: + - '288019' + Connection: + - keep-alive + Access-Control-Allow-Origin: + - "*" + body: + encoding: ASCII-8BIT + string: !binary |- + {"took":113,"timed_out":false,"_shards":{"total":23,"successful":23,"skipped":0,"failed":0},"hits":{"total":{"value":2662,"relation":"eq"},"max_score":null,"hits":[{"_index":"dspace-2026-02-09t19-23-02","_id":"dspace:1721.1-165085","_score":10.457806,"_source":{"summary":["In the National Basketball Association (NBA), basketball data and analytics is an area of significant financial investment for all 30 franchises, despite there being little quantitative evidence demonstrating analytics adoption actually improves team-level performance. This study seeks to measure the return on investment of analytics on NBA team success in a time of great demand for analytical front office personnel. Using a two-way fixed effects modeling approach, we identify the causal effect of analytics department headcounts on regular season wins using 12 years of season-level data for each team. 
We find a positive and statistically significant effect, suggesting clubs that invest more in analytics tend to outperform competitors when controlling for roster characteristics, injuries, difficulty of schedule, and team-specific and time-specific effects. This research contributes to the body of literature affirming the value of data analytics for organizational performance and supports current investments in analytics being made by NBA teams."],"timdex_provenance":{"source":"dspace","run_date":"2026-03-13","run_id":"60d21b85-30e5-5480-337b-fd30321c6b6c_8bac6d5e-afd5-2dc4-a025-094f50ff17bd","run_record_offset":28},"languages":["en"],"citation":"Wang, H., Sarker, A., & Hosoi, A. (2025). The Effect of Basketball Analytics Investment on National Basketball Association (NBA) Team Performance. Journal of Sports Economics, 26(6), 668-688.","file_formats":["application/pdf"],"identifiers":[{"value":"https://hdl.handle.net/1721.1/165085","kind":"uri"}],"format":"electronic resource","embedding_full_record":{"authored":0.00483300443738699,"rebounds":0.003792762290686369,"inform":0.005033987108618021,"##ker":0.32739731669425964,"##i":0.1980927288532257,"analyzing":0.2434443086385727,"competitors":0.19835051894187927,"stats":0.32522857189178467,"##ette":0.2618180811405182,"record":0.14649361371994019,"championship":0.08970509469509125,"##x":0.24548254907131195,"investing":0.30400145053863525,"injury":0.24254153668880463,"publishing":0.23609288036823273,"wins":0.33941397070884705,"organizational":0.32620757818222046,"models":0.17696574330329895,"using":0.023564882576465607,"af":0.11762866377830505,"impact":0.3405466675758362,"league":0.15658791363239288,"investment":0.6186730265617371,"engineers":0.07053177058696747,"economy":0.1287858635187149,"analysis":0.5486773252487183,"##basket":0.03727962076663971,"demand":0.004965230356901884,"ar":0.1623823195695877,"wang":0.4013051688671112,"correlation":0.0702986791729927,"adopt":0.02458050474524498,"institute":0.34670737385749817,
"returns":0.14239034056663513,"competitive":0.0871296375989914,"invested":0.197487473487854,"object":0.12123031914234161,"boston":0.16704927384853363,"statistical":0.33870911598205566,"nets":0.06507312506437302,"affect":0.28550124168395996,"cited":0.2414742410182953,"association":0.13781724870204926,"##ettes":0.0640859454870224,"proven":0.2889358699321747,"investments":0.33833828568458557,"##des":0.162139430642128,"measurement":0.013262741267681122,"worth":0.029773883521556854,"roster":0.24813212454319,"journal":0.4408372938632965,"citations":0.31905561685562134,"adoption":0.3094046115875244,"does":0.07218693941831589,"mit":0.47608017921447754,"national":0.19127292931079865,"departments":0.15151198208332062,"relationship":0.020197395235300064,"##ded":0.012439455837011337,"stat":0.27374452352523804,"mechanics":0.02505243755877018,"team":0.5648559331893921,"dept":0.16022242605686188,"fiba":0.13642051815986633,"cavaliers":0.009747179225087166,"metric":0.2429439127445221,"##ance":0.26810869574546814,"analytic":0.4726637601852417,"adopted":0.10728978365659714,"publications":0.24129238724708557,"evidence":0.16222333908081055,"##mer":0.1342613250017166,"invest":0.39057818055152893,"nationals":0.10913808643817902,"organisation":0.07676558196544647,"run":0.22440651059150696,"source":0.1683836579322815,"do":0.05590168386697769,"##pers":0.07759539783000946,"research":0.39885565638542175,"ds":0.5476102828979492,"##21":0.17087087035179138,"analytics":0.7221149802207947,"club":0.12472434341907501,"scheduling":0.03523804992437363,"tim":0.46858692169189453,"ur":0.12057366967201233,"tech":0.10767471790313721,"mlb":0.014444065280258656,"ncaa":0.27180495858192444,"nielsen":0.1453147828578949,"engineering":0.23316705226898193,"significant":0.23159800469875336,"##so":0.34595298767089844,"article":0.18896609544754028,"improving":0.1595272570848465,"measure":0.23048138618469238,"spending":0.11690328270196915,"success":0.4059431850910187,"citing":0.12620405852794647,"fixed":0.3266894817352
295,"66":0.03817429021000862,"analysts":0.24936729669570923,"formats":0.03084426186978817,"analytical":0.476420521736145,"sources":0.027622273191809654,"records":0.012865365482866764,"importance":0.0050969794392585754,"mass":0.2508464753627777,"standings":0.03871286287903786,"content":0.059414591640233994,"society":0.13153338432312012,"authorship":0.023647533729672432,"causal":0.17696064710617065,"##co":0.11776603758335114,"performances":0.1789798140525818,"pixel":0.05160589888691902,"turnover":0.051276449114084244,"successful":0.09099702537059784,"##com":0.038724385201931,"digital":0.19032178819179535,"effectiveness":0.10742103308439255,"winning":0.02885136380791664,"citation":0.3753284811973572,"org":0.020824342966079712,"perform":0.09498482197523117,"affects":0.05750870704650879,"technology":0.14464010298252106,"improvement":0.14622284471988678,"engineer":0.03111451491713524,"##de":0.5359204411506653,"henry":0.2243817299604416,"schedule":0.042090680450201035,"1721":0.3152943551540375,"pdf":0.07503391802310944,"regression":0.13188129663467407,"publish":0.16642363369464874,"analyst":0.3845071792602539,"personnel":0.16422149538993835,"contributors":0.139948308467865,"articles":0.06910190731287003,"finance":0.040714677423238754,"college":0.1119426041841507,"basket":0.14207886159420013,"measured":0.11666429042816162,"modeling":0.25303319096565247,"espn":0.07067327201366425,"ho":0.33020952343940735,"improves":0.10071452707052231,"mechanical":0.1229412853717804,"competition":0.06431739032268524,"zhang":0.11683424562215805,"tracking":0.14748187363147736,"approach":0.1432684063911438,"##vs":0.11007469147443771,"improved":0.2227373868227005,"measures":0.10443554073572159,"##ifier":0.011315791867673397,"massachusetts":0.5193345546722412,"model":0.23153436183929443,"id":0.2684827446937561,"efficiency":0.08015455305576324,"teams":0.3874035179615021,"ahl":0.005403110757470131,"players":0.08680970966815948,"impacts":0.19381672143936157,"##tech":3.121751651633531E-4,"nba":0.9368
412494659424,"journals":0.15051427483558655,"intelligence":0.012308428063988686,"knicks":0.06064468249678612,"issn":0.006873367354273796,"anal":0.31847840547561646,"analyze":0.23099017143249512,"nbl":0.0371711365878582,"baseball":0.08230888843536377,"athletic":0.20476317405700684,"valuable":0.012511027976870537,"participation":2.2666338190902025E-4,"study":0.22262078523635864,"##per":0.23226282000541687,"##85":0.14415298402309418,"commons":0.1896585375070572,"rebound":0.11439929157495499,"electronic":0.08433806896209717,"regular":0.1293708235025406,"wnba":0.5108566284179688,"hockey":0.17532771825790405,"##bution":0.07312816381454468,"quan":0.05327353626489639,"##unt":0.21827930212020874,"positive":0.2560640275478363,"organization":0.2822425365447998,"cite":0.30610477924346924,"heads":0.11880984157323837,"economic":0.3363702595233917,"return":0.2750019133090973,"statistics":0.43932417035102844,"date":0.10210921615362167,"franchise":0.23302961885929108,"data":0.778795599937439,"injuries":0.08149801939725876,"use":0.09920882433652878,"office":0.1009049043059349,"space":0.11342091858386993,"influence":0.12401829659938812,"eco":0.09726429730653763,"basketball":0.8264750242233276,"publication":0.3438825011253357,"1650":0.12534485757350922,"implemented":0.006973759271204472,"sage":0.4516873359680176,"publishers":0.0948072001338005,"orlando":0.08646208792924881,"##ix":0.014596574008464813,"franchises":0.25198060274124146,"offset":0.37255364656448364,"resource":0.21287602186203003,"level":0.17145605385303497,"insights":0.021293707191944122,"kind":0.047965455800294876,"author":0.004397143144160509,"##pace":0.4581374526023865,"format":0.11830489337444305,"published":0.2723352015018463,"affected":0.15012627840042114,"rankings":0.185667023062706,"effects":0.5306780934333801,"efforts":0.06826064735651016,"##pro":0.11588629335165024,"202":0.20829176902770996,"improve":0.3048801124095917,"effect":0.5868650078773499,"publisher":0.18286298215389252,"harvard":0.1313050389289856,"refer
ees":0.003372898092493415,"##tiv":0.09576403349637985,"game":0.06411959230899811,"lakers":0.1728333830833435,"##duction":0.2513018846511841,"ns":0.06308557838201523,"university":0.22075267136096954,"financial":0.17525207996368408,"##ducted":0.016475463286042213,"values":0.04902276396751404,"link":0.0030865436419844627,"lineup":0.10249074548482895,"why":0.02282966673374176,"roi":0.21678435802459717,"head":0.3269246220588684,"effective":0.1750311404466629,"database":0.01761605404317379,"contributor":0.0653209239244461,"##5":0.013814386911690235,"competitor":0.07544703036546707,"spend":0.20643791556358337,"clubs":0.06666307151317596,"studies":0.061681363731622696,"department":0.33980754017829895,"value":0.5909327864646912,"win":0.18458160758018494,"tufts":0.008202028460800648,"economists":0.05749127268791199,"##ass":0.05592064559459686,"soccer":0.15778614580631256,"economist":0.23242071270942688,"sports":0.5444217324256897,"sar":0.4443624019622803,"performing":0.06993822753429413,"implementation":0.028237806633114815,"resources":0.10146132111549377,"approaches":0.06401660293340683,"specific":0.07001840323209763,"economics":0.42911845445632935,"investor":0.06469711661338806,"performance":0.5796993970870972,"nhl":0.191616952419281,"quantitative":0.24829912185668945,"variable":0.030324427410960197,"organizations":0.012352881021797657,"front":0.1863066703081131,"sport":0.3994569182395935,"timothy":0.07230345904827118},"dates":[{"kind":"Publication date","value":"2025-08"}],"source":"DSpace@MIT","title":"The Effect of Basketball Analytics Investment on National Basketball Association (NBA) Team Performance","related_items":[{"description":"Journal of Sports Economics","relationship":"host"}],"source_link":"https://dspace.mit.edu/handle/1721.1/165085","content_type":["Article"],"rights":[{"description":"Creative Commons Attribution-Noncommercial","kind":"useAndReproduction"}],"publishers":[{"name":"SAGE 
Publications"}],"links":[{"url":"https://hdl.handle.net/1721.1/165085","kind":"Digital object URL","text":"Digital object URL"}],"contributors":[{"value":"Wang, Henry","kind":"author"},{"value":"Sarker, Arnab","kind":"author"},{"value":"Hosoi, Anette","kind":"author"},{"value":"Massachusetts Institute of Technology. Institute for Data, Systems, and Society","kind":"department"},{"value":"Massachusetts Institute of Technology. Department of Mechanical Engineering","kind":"department"}],"timdex_record_id":"dspace:1721.1-165085"},"sort":[10.457806,1754006400000]},{"_index":"dspace-2026-02-09t19-23-02","_id":"dspace:1721.1-162833","_score":10.443916,"_source":{"summary":["What-if analysis (WIA) is essential for data-driven decision-making, allowing users to assess how changes in variables impact outcomes and explore alternative scenarios. Existing WIA research primarily supports the workflows of data scientists and analysts, and largely overlooks business professionals who engage in WIA through non-technical means. To bridge this gap, we conduct a two-part user study with 22 business professionals across marketing, sales, product, and operations roles. The first study examines their existing WIA practices, tools, and challenges. Findings reveal that business professionals perform many WIA techniques independently using rudimentary tools due to various constraints. We then implement representative WIA techniques in a visual analytics prototype and use it as a probe to conduct a follow-up study evaluating business professionals’ practical use of the techniques. Results show that these techniques improve decision-making efficiency and confidence while underscoring the need for better support in data preparation, risk assessment, and domain knowledge integration. 
Finally, we offer design recommendations to enhance future business analytics systems."],"timdex_provenance":{"source":"dspace","run_date":"2026-04-15","run_id":"a816f3dc-51ac-7e5f-cec8-1086ffc54274_861de409-c771-2e2c-c416-93c81a0885e3","run_record_offset":179},"languages":["en"],"citation":"Sneha Gathani, Zhicheng Liu, Peter J. Haas, and Çağatay Demiralp. 2025. What-if Analysis for Business Professionals: Current Practices and Future Opportunities. In Proceedings of the 2025 CHI Conference on Human Factors in Computing Systems (CHI '25). Association for Computing Machinery, New York, NY, USA, Article 973, 1–17.","file_formats":["application/pdf"],"identifiers":[{"value":"979-8-4007-1394-1","kind":"isbn"},{"value":"https://hdl.handle.net/1721.1/162833","kind":"uri"},{"value":"PUBLISHER_POLICY","kind":"mitlicense"}],"format":"electronic resource","embedding_full_record":{"authored":0.05191252753138542,"##a":1.0027642250061035,"inform":0.029083512723445892,"prototypes":0.21854248642921448,"##ne":0.34707143902778625,"##g":0.018550541251897812,"##i":0.2105436772108078,"scenarios":0.23109446465969086,"##m":0.2472834438085556,"constraints":0.17049647867679596,"professional":0.5031987428665161,"analyzing":0.31838998198509216,"evaluation":0.12601420283317566,"##p":0.09605764597654343,"contribution":0.007430742494761944,"outcomes":0.1648963838815689,"record":0.09035652130842209,"##ancy":0.004478675778955221,"##x":0.12095870822668076,"visual":0.25518304109573364,"##ances":0.012812867760658264,"publishing":0.2174195498228073,"meeting":0.026077469810843468,"knowledge":0.33276623487472534,"##diment":0.2506369650363922,"ac":0.3116277754306793,"using":0.009080130606889725,"impact":0.009445489384233952,"ai":0.390805184841156,"opportunity":0.35829856991767883,"analysis":0.7002549767494202,"-":0.5897051692008972,"domain":0.39626672863960266,"science":0.16306333243846893,"institute":0.294184148311615,"evaluating":0.009789041243493557,"firms":0.06488903611898422,"agile":0.0363974757492
5423,"object":0.137034609913826,"boston":0.07730861008167267,"statistical":0.25293007493019104,"25":0.538654625415802,"conference":0.51813805103302,"##ral":0.2653306722640991,"independent":0.03199983388185501,"association":0.2707478404045105,"cited":0.2047041356563568,"proven":0.25799131393432617,"current":0.31249332427978516,"citations":0.2708944082260132,"journal":0.15914076566696167,"systems":0.22397150099277496,"scenario":0.15866699814796448,"peter":0.14899370074272156,"audit":0.09467830508947372,"139":0.12069577723741531,"##flow":0.183265820145607,"mit":0.5662500262260437,"wikipedia":0.15268084406852722,"seo":0.049579720944166183,"u2":0.006020034663379192,"computers":0.18979142606258392,"conferences":0.1843430995941162,"email":0.018208639696240425,"policy":0.14327730238437653,"variables":0.2030119150876999,"business":0.7641991972923279,"decision":0.450635701417923,"languages":0.1329067200422287,"strategies":0.048894643783569336,"consulting":0.09751559793949127,"maker":0.06228049099445343,"j":0.05389202758669853,"practices":0.415806382894516,"##01":0.3468054533004761,"marketing":0.2826179563999176,"consultant":0.02450939640402794,"ibm":0.10680146515369415,"metric":0.0418231338262558,"z":0.33311793208122253,"##ance":0.31156492233276367,"analytic":0.27576497197151184,"essential":0.39925244450569153,"publications":0.1327870935201645,"performs":0.03832448273897171,"##as":0.3751745820045471,"engagement":0.11762499064207077,"##ay":0.0967610701918602,"project":0.005974237807095051,"language":0.17219512164592743,"run":0.16684575378894806,"source":0.1372843086719513,"research":0.5320663452148438,"ds":0.45649129152297974,"ata":0.35058626532554626,"##21":0.014081788249313831,"analytics":0.4742554724216461,"##aa":0.3309778869152069,"assessment":0.32205209136009216,"##16":0.10311861336231232,"##ai":0.033662669360637665,"tim":0.4088604748249054,"liu":0.3322962820529938,"implement":0.1529620885848999,"cambridge":0.03857250511646271,"ict":0.11336133629083633,"ur":0.123089060187
33978,"results":0.06998555362224579,"computational":0.09694395959377289,"tech":0.04912598058581352,"making":0.18895307183265686,"zen":0.028141532093286514,"chi":0.5461336374282837,"solutions":0.05720190331339836,"pro":0.09123106300830841,"##anal":0.08108075708150864,"users":0.27661722898483276,"article":0.20947150886058807,"##32":0.03605867549777031,"technologies":0.08686001598834991,"##25":0.25831660628318787,"laboratory":0.13162736594676971,"citing":0.07833412289619446,"support":0.11836963891983032,"useful":0.05237974226474762,"analysts":0.35668832063674927,"formats":0.08756514638662338,"analytical":0.3124907612800598,"technical":0.25080201029777527,"scientist":0.14821840822696686,"prospects":0.057297393679618835,"mass":0.15411165356636047,"isbn":0.1309003084897995,"title":0.10061553120613098,"papers":0.00335139618255198,"content":0.06880553811788559,"##33":0.2266327142715454,"symposium":0.11593673378229141,"##34":0.05751659348607063,"wi":0.9889600276947021,"179":0.025863630697131157,"authorship":0.056988127529621124,"ga":0.320101261138916,"haas":0.485280305147171,"1717":0.01744004897773266,"factor":0.4462113380432129,"##hic":0.2467958778142929,"human":0.5113061666488647,"reporting":0.0018579547759145498,"digital":0.2638869881629944,"wisconsin":0.2615967094898224,"convention":0.08451136201620102,"summary":0.05320945009589195,"practical":0.1873079538345337,"citation":0.3520885407924652,"perform":0.16486212611198425,"technology":0.18681007623672485,"futures":0.21160642802715302,"improvement":0.01718677394092083,"##de":0.3302842378616333,"existing":0.10321980714797974,"1722":0.06332427263259888,"artificial":0.4514016807079315,"1721":0.3791588544845581,"what":0.2329787164926529,"pdf":0.22011995315551758,"2015":0.024042215198278427,"management":0.003898275550454855,"regression":0.08102430403232574,"publish":0.1644141674041748,"analyst":0.3620862662792206,"risk":0.24512092769145966,"contributors":0.11170214414596558,"articles":0.07271508872509003,"humans":0.032889161258
93593,"practice":0.3615918457508087,"modeling":0.07830069214105606,"software":0.09446679055690765,"hr":0.1692289412021637,"zhang":0.10025336593389511,"approach":0.08446476608514786,"preparation":0.11319591104984283,"improved":0.05897941067814827,"##ifier":0.022686123847961426,"massachusetts":0.5117567181587219,"proceedings":0.28894752264022827,"id":0.16295357048511505,"1618":0.0909525603055954,"if":1.2448915243148804,"businesses":0.2775430679321289,"97":0.0745692104101181,"##nse":0.05948706716299057,"algorithm":0.10298531502485275,"profession":0.11282175779342651,"efficiency":0.2354254573583603,"##wi":0.1365964263677597,"method":0.13638533651828766,"##lice":0.10936585813760757,"handle":0.04463567957282066,"##tech":0.031338125467300415,"intel":0.02773711457848549,"creative":0.07104255259037018,"intelligence":0.3849372863769531,"1624":0.013055210933089256,"practitioners":0.2064058780670166,"system":0.16150689125061035,"anal":0.2684856057167053,"analyze":0.2688952088356018,"driven":0.3371671438217163,"integration":0.22398848831653595,"1628":0.3145601451396942,"machinery":0.25017011165618896,"authors":0.08048336952924728,"algorithms":0.0664784163236618,"study":0.27611052989959717,"methods":0.18959590792655945,"##fat":0.12349352985620499,"professions":0.10403122007846832,"##ha":0.32250362634658813,"1086":0.019704598933458328,"tools":0.3516285717487335,"commons":0.21807773411273956,"##hen":0.24843475222587585,"computer":0.40113702416419983,"file":0.08762799203395844,"1632":0.05831776559352875,"rights":0.049999650567770004,"electronic":0.16005150973796844,"decisions":0.2508869171142578,"imperative":0.05929991230368614,"outcome":0.06795349717140198,"product":0.10073764622211456,"##bution":0.03400857374072075,"efficient":0.0272274911403656,"topics":0.08242319524288177,"implementing":0.05440111458301544,"techno":0.0025340120773762465,"##if":0.560657799243927,"opportunities":0.31559762358665466,"prototype":0.28409579396247864,"mba":0.093415766954422,"framework":0.1269387304782
8674,"assess":0.13614758849143982,"future":0.5342420339584351,"machine":0.156990185379982,"cite":0.2907610833644867,"constraint":0.047468751668930054,"statistics":0.16368265450000763,"date":0.13735339045524597,"data":0.5884782671928406,"use":0.11631139367818832,"prepared":0.023985303938388824,"findings":0.07109513878822327,"lab":0.05085355415940285,"sales":0.1477455049753189,"space":0.10278099030256271,"cloud":0.05310815945267677,"[SEP]":0.7035151720046997,"ma":0.13242633640766144,"publication":0.3809087574481964,"implemented":0.14669254422187805,"publishers":0.10212524235248566,"potential":0.08712512254714966,"representative":0.03368213772773743,"offset":0.3483330011367798,"resource":0.2347545474767685,"insights":0.004414400551468134,"author":0.12266872823238373,"kind":0.08087065070867538,"##pace":0.46121227741241455,"format":0.2043294608592987,"domains":0.18895724415779114,"published":0.29758787155151367,"tool":0.3202323913574219,"license":0.012752658687531948,"##pro":0.16157326102256775,"202":0.2806169092655182,"scientists":0.17539474368095398,"techniques":0.4296042323112488,"improve":0.17039155960083008,"publisher":0.22064021229743958,"topic":0.0615447536110878,"harvard":0.12835632264614105,"code":0.08719901740550995,"##duction":0.2882821261882782,"challenges":0.20127509534358978,"purpose":0.033406488597393036,"university":0.150497704744339,"professionals":0.4937039613723755,"technique":0.32183340191841125,"ny":0.10452629625797272,"computing":0.420647531747818,"database":0.16211634874343872,"operations":0.17537201941013336,"contributor":0.009288248606026173,"paper":0.04378176108002663,"##5":0.3104284703731537,"studies":0.14025089144706726,"##than":0.3172648251056671,"department":0.05544678866863251,"value":0.5170698165893555,"on":0.28628411889076233,"25th":0.08428943157196045,"assessments":0.10193905234336853,"sap":0.04737306758761406,"implementation":0.22245781123638153,"confidence":0.2130860537290573,"alternative":0.027048248797655106,"resources":0.13590683043
003082,"approaches":0.151011660695076,"factors":0.6206023097038269,"probe":0.32873663306236267,"cyber":0.02938186563551426,"demi":0.43219703435897827,"performance":0.03776451200246811,"##tha":0.02196970209479332,"application":0.10478946566581726,"engage":0.09700187295675278,"york":0.23773902654647827,"variable":0.20153282582759857,"challenge":0.11086766421794891,"independently":0.03500847890973091,"wireless":0.0839691236615181,"machines":0.09642960876226425,"strategy":0.07080487906932831,"user":0.16414625942707062,"hypothesis":0.04968912899494171,"methodology":0.21711790561676025},"dates":[{"kind":"Publication date","value":"2025-04-25"}],"source":"DSpace@MIT","title":"What-if Analysis for Business Professionals: Current Practices and Future Opportunities","source_link":"https://dspace.mit.edu/handle/1721.1/162833","content_type":["Article"],"rights":[{"description":"Creative Commons Attribution","kind":"useAndReproduction"}],"publishers":[{"name":"ACM|CHI Conference on Human Factors in Computing Systems"}],"links":[{"url":"https://hdl.handle.net/1721.1/162833","kind":"Digital object URL","text":"Digital object URL"}],"contributors":[{"value":"Gathani, Sneha","kind":"author"},{"value":"Liu, Zhicheng","kind":"author"},{"value":"Haas, Peter J.","kind":"author"},{"value":"Demiralp, ?a?atay","kind":"author"},{"value":"Massachusetts Institute of Technology. 
Computer Science and Artificial Intelligence Laboratory","kind":"department"}],"timdex_record_id":"dspace:1721.1-162833"},"sort":[10.443916,1745539200000]},{"_index":"mitlibwebsite-2026-02-12t15-43-22","_id":"mitlibwebsite:99bb2005eab80d9b7a387d2f931da7e4","_score":10.389838,"_source":{"source":"MIT Libraries Website","source_link":"https://libraries.mit.edu/news/quick-dirty-data-management-the-5-things-you-should-absolutely-be-doing-with-your-data-now-6/44162/","timdex_record_id":"mitlibwebsite:99bb2005eab80d9b7a387d2f931da7e4","title":"Quick & dirty data management: the 5 things you should absolutely be doing with your data now | News","citation":"MIT Libraries. Quick & dirty data management: the 5 things you should absolutely be doing with your data now | News. Website. https://libraries.mit.edu/news/quick-dirty-data-management-the-5-things-you-should-absolutely-be-doing-with-your-data-now-6/44162/","content_type":["Website"],"contributors":[{"value":"MIT Libraries","kind":"creator","mit_affiliated":true}],"dates":[{"kind":"Accessed","value":"2026-04-01T23:03:33.306111+00:00"}],"format":"electronic resource","fulltext":"Quick & dirty data management: the 5 things you should absolutely be doing with your data now By Brigham Fay on March 17, 2026 in Data Event date April 10, 2026 01:00 PM\t\t\t-\t\t\t02:00 PM For more about this event, please visit 
https://calendar.mit.edu/event/quick-dirty-data-management-the-5-things-you-should-absolutely-be-doing-with-your-data-now-3950","links":[{"url":"https://libraries.mit.edu/news/quick-dirty-data-management-the-5-things-you-should-absolutely-be-doing-with-your-data-now-6/44162/","kind":"Website"}],"timdex_provenance":{"source":"mitlibwebsite","run_date":"2026-04-01","run_id":"ccead835-7bed-7a69-f289-8e038c5963dc_222f0b97-3cb4-7b75-be5b-fc6876122bf9","run_record_offset":27},"embedding_full_record":{"04":0.031054982915520668,"your":0.2677822411060333,"password":0.04484247416257858,"##hot":0.02797878161072731,"##u":0.09627774357795715,"record":0.2706662118434906,"##x":0.2172762006521225,"api":0.10560024529695511,"events":0.13162025809288025,"you":0.09163212031126022,"databases":0.0674922913312912,"using":0.16574402153491974,"#":0.06573346257209778,"&":0.20999941229820251,"17":0.057539187371730804,"-":0.006797522306442261,"version":0.0013726266333833337,"something":0.0572061687707901,"5":0.6789326071739197,"domain":0.044723693281412125,"institute":0.1343909651041031,"referencing":1.7032105824910104E-4,"archives":0.09791985154151917,"statistical":0.06467604637145996,"be":0.25038662552833557,"access":0.03914772346615791,"cited":0.2797781229019165,"proven":0.19715192914009094,"##des":0.07569538056850433,"posted":0.0019136941991746426,"##text":0.06787291169166565,"how":0.01724790222942829,"citations":0.3241134285926819,"journal":0.018506553024053574,"managed":0.13973921537399292,"mit":0.7194049954414368,"wikipedia":0.11997506022453308,"##ded":0.01866740733385086,"_":0.1104559674859047,"dirty":0.5896445512771606,"calendar":0.18462851643562317,"cc":0.10637160390615463,"website":0.4394506514072418,"manager":0.2524646520614624,"quicker":0.01677314192056656,"librarian":0.30234116315841675,"march":0.19389067590236664,"fast":0.2021806538105011,"absolute":0.3065606653690338,"information":0.20274342596530914,"##ance":0.2803010046482086,"thing":0.19754312932491302,"db":0.178822249174118
04,"44":0.020413050428032875,"administration":0.005922554060816765,"rapid":0.020889487117528915,"project":0.06108800694346428,"run":0.29577115178108215,"sites":0.03054068237543106,"retrieved":0.019089028239250183,"source":0.36868295073509216,"do":0.01725970394909382,"research":0.1549757570028305,"395":0.17727793753147125,"analytics":0.14944222569465637,"apache":0.029748978093266487,"affiliation":0.1206887736916542,"things":0.3904760181903839,"tim":0.4819258749485016,"five":0.5238211750984192,"ur":0.21953824162483215,"ed":0.14392277598381042,"info":0.12785564363002777,"campus":0.02344180829823017,"wrote":0.0312606543302536,"garbage":0.0610080249607563,"collection":0.015555204823613167,"##cb":0.027507854625582695,"institutional":0.0020690294913947582,"citing":0.20417791604995728,"page":0.032129861414432526,"doing":0.46381354331970215,"sources":0.12393900752067566,"brigham":0.4254595637321472,"records":0.10338225960731506,"##ete":0.019120238721370697,"update":0.03103329986333847,"title":0.09214888513088226,"##da":0.006608607247471809,"content":0.10805842280387878,"symposium":0.11033401638269424,"sourced":0.07824677973985672,"##38":0.07485401630401611,"authorship":0.009064335376024246,"now":0.5294740796089172,"news":0.4606345295906067,"citation":0.4037435054779053,"org":0.07926895469427109,"libraries":0.5318983793258667,"manage":0.12658393383026123,"##de":0.480607807636261,"with":0.3667549192905426,"management":0.5819224715232849,"referenced":0.015496164560317993,"contributors":0.09125857800245285,"byu":0.3176669776439667,"college":0.05177845433354378,"copyright":0.12986385822296143,"software":0.07833080738782883,"quickly":0.28330928087234497,"repository":0.17197006940841675,"when":0.3322000801563263,"april":0.2298988699913025,"hack":0.03226395696401596,"number":0.011512535624206066,"universities":0.12309303879737854,"collections":0.06550033390522003,"##ead":0.17755159735679626,"massachusetts":0.038007788360118866,"id":0.2749236226081848,"text":0.019207220524549484,"fay
":0.4011238217353821,"dates":0.1097077950835228,"utah":0.10763170570135117,"hash":0.09649420529603958,"managers":0.048172738403081894,"server":0.06080018728971481,"computer":8.669424569234252E-4,"library":0.6252824664115906,"file":0.1352214515209198,"bibliography":0.07063960283994675,"web":0.25746047496795654,"electronic":0.15097807347774506,"event":0.4382392168045044,"creator":0.1405920535326004,"topics":0.10169091075658798,"site":0.23403403162956238,"stored":0.044646069407463074,"cite":0.39168548583984375,"php":0.12772150337696075,"websites":0.25976818799972534,"li":0.006890921853482723,"##mana":0.02635863982141018,"statistics":0.15924787521362305,"date":0.48621752858161926,"quick":0.6519006490707397,"data":0.9039483070373535,"reference":0.12580865621566772,"cloud":0.07140999287366867,"find":0.011418276466429234,"publication":0.02644781395792961,"should":0.4729210138320923,"links":0.15330857038497925,"offset":0.38504543900489807,"resource":0.2230571210384369,"kind":0.09700614213943481,"dirt":0.3042531907558441,"format":0.2173396646976471,"archive":0.08260634541511536,"published":0.05468987673521042,"my":0.08052916824817657,"mormon":0.1961253583431244,"done":0.14879219233989716,"441":0.2913586497306824,"202":0.23394539952278137,"cleanup":0.02971869707107544,"absolutely":0.3848061263561249,"true":0.14969442784786224,"topic":0.1585649847984314,"managing":0.17729303240776062,"code":0.1556026190519333,"university":0.3348432779312134,"link":0.2814074158668518,"affiliated":0.15392540395259857,"their":0.013581964187324047,"storage":0.12990324199199677,"sql":0.21279653906822205,"451":0.10046929866075516,"running":0.004198556765913963,"database":0.4253959059715271,"computing":0.04671486094594002,"contributor":0.0059388624504208565,"filthy":0.09796293079853058,"##6":0.10912685096263885,"##8":0.033971790224313736,"##lib":0.33058395981788635,"value":0.14984647929668427,"sloppy":0.05236157402396202,"resources":0.10605408251285553,"clean":0.2688840329647064,"##set":0.08163017034
53064,"affiliate":0.01715889573097229,"timothy":0.141994908452034}},"sort":[10.389838,1775084613306]},{"_index":"dspace-2026-02-09t19-23-02","_id":"dspace:1721.1-164819","_score":10.180051,"_source":{"summary":["Modern data analytics platforms increasingly adopt disaggregated architectures, storing data in cost-effective cloud object stores. While this approach enables a clean separation of concerns, allowing each layer to be independently managed and scaled, it introduces significant performance bottlenecks due to expensive data movement. Effective data layouts, which organize data to minimize unnecessary data reads, are thus critical to achieving high query performance. However, existing techniques typically rely on manually specified layouts, collect limited metadata, or lack mechanisms to dynamically adapt to changing data and workloads.\r\n\r\nThis thesis investigates adaptive, metadata-rich, expressive data layouts for cloud table storage. First, we introduce Pando, a correlation-aware layout technique that leverages rich metadata on query predicates to significantly improve data skipping. Next, we propose CopyRight, a partial replication strategy that selectively replicates subsets of data and optimizes each replica differently, efficiently serving heterogeneous query patterns. Finally, we describe Self-Organizing Data Containers (SDCs), a practical table storage layer for the cloud that incrementally reorganizes complex data layouts based on changes in data and workload distributions."],"timdex_provenance":{"source":"dspace","run_date":"2026-02-14","run_id":"17354145-cb2b-3380-1900-41a4b1a3f9d1_dc5b7070-742a-52bf-723c-99a2bbe3b2ec","run_record_offset":1},"citation":"Sudhir, Sivaprasad (2025-09): Optimizing Data Layouts for Evolving Cloud Table Storage. Massachusetts Institute of Technology. Thesis. 
https://dspace.mit.edu/handle/1721.1/164819","file_formats":["application/pdf"],"identifiers":[{"value":"https://hdl.handle.net/1721.1/164819","kind":"uri"},{"value":"https://orcid.org/0009-0005-4522-0394","kind":"orcid"}],"format":"electronic resource","embedding_full_record":{"##c":0.24149231612682343,"optimal":0.31896793842315674,"##d":0.2872020900249481,"objects":0.26138854026794434,"evolved":0.10343620926141739,"##i":0.06292740255594254,"##are":0.2910038232803345,"##frame":0.12272259593009949,"##l":0.021302854642271996,"##q":0.14921516180038452,"introduced":0.012815751135349274,"##s":0.02040053717792034,"retrieval":0.0756797045469284,"xml":0.004526963923126459,"record":0.34173333644866943,"complex":0.21374215185642242,"##x":0.2678435742855072,"##ances":0.03485210984945297,"persistent":0.0015232966979965568,"databases":0.08510152995586395,"#":0.08091883361339569,"engineers":0.05069326236844063,"google":0.1056135967373848,"analysis":0.13448773324489594,"version":0.008705832995474339,"bucket":0.06254454702138901,"correlation":0.35706138610839844,"aw":0.11002331972122192,"science":0.11374565213918686,"domain":0.07419329881668091,"institute":0.3371697664260864,"agile":0.16748744249343872,"##rre":0.09349370747804642,"compression":0.005501697771251202,"object":0.4361812472343445,"@":0.07707001268863678,"boston":0.012466255575418472,"hosting":0.09910810738801956,"achieve":0.0876418948173523,"cited":0.1832098811864853,"proven":0.26606032252311707,"bottle":0.23312625288963318,"manual":0.10556166619062424,"adaptive":0.5601310729980469,"citations":0.24495942890644073,"journal":0.03689362853765488,"##zing":0.16024313867092133,"hana":0.09396027773618698,"seo":0.03220886364579201,"computers":0.07865734398365021,"cb":0.14558827877044678,"_":0.14178478717803955,"minimize":0.2735673785209656,"replicate":0.38500988483428955,"d":0.05540130287408829,"r":0.061819661408662796,"information":0.15235738456249237,"##ance":0.3146308362483978,"analytic":0.17215481400489807,"db":0.124780058
86077881,"##ani":0.08576413244009018,"di":0.2480970174074173,"##and":0.03611132875084877,"ds":0.6250885725021362,"analytics":0.4550188481807709,"layers":0.3656404912471771,"tim":0.561254620552063,"pan":0.7991642355918884,"skipping":0.5704744458198547,"##load":0.2601282596588135,"patterns":0.252685546875,"encoding":0.12812988460063934,"##cb":0.055495887994766235,"homogeneous":0.0553605780005455,"##bf":0.028664927929639816,"containers":0.5420688390731812,"##cs":0.3071833848953247,"formats":0.24080942571163177,"##net":0.036261964589357376,"analytical":0.018058497458696365,"aggregation":0.07327170670032501,"##da":0.05052961781620979,"content":0.2334141731262207,"skipped":0.3145965337753296,"layered":0.08941558003425598,"load":0.09254731982946396,"sourced":0.01727648265659809,"##ci":0.42414847016334534,"authorship":0.04016055539250374,"digital":0.3580097258090973,"effectiveness":0.146780863404274,"practical":0.2836502194404602,"citation":0.3313540816307068,"perform":0.020611073821783066,"rich":0.17868074774742126,"permission":0.04103619232773781,"evolution":0.31523579359054565,"##de":0.5181726813316345,"pdf":0.27886849641799927,"berkeley":0.06683076173067093,"coffee":0.07068950682878494,"publish":0.05689543858170509,"##do":0.5468977093696594,"contributors":0.09080657362937927,"hd":0.138924241065979,"##ero":0.0942017063498497,"##gate":0.03288658335804939,"subset":0.1678312122821808,"##eous":0.1197468712925911,"##ental":0.08849960565567017,"copyright":0.6112802028656006,"approach":0.2571250796318054,"improved":0.11980676651000977,"tables":0.5688241124153137,"##ifier":0.07989779114723206,"##dos":0.18629246950149536,"thesis":0.3510429561138153,"id":0.3941951096057892,"https":0.028980961069464684,"algorithm":0.0845080241560936,"reduce":0.030456770211458206,"io":0.03614920377731323,"electrical":0.1753012090921402,"distributed":0.053788818418979645,"advisors":0.03273779898881912,"handle":0.2274600714445114,"propose":0.12950102984905243,"distributions":0.006874723359942436,"part
ial":0.2712439000606537,"hash":0.07666335999965668,"server":0.1668967455625534,"algorithms":0.06941544264554977,"semantic":0.009665578603744507,"skip":0.5399379730224609,"file":0.31619253754615784,"##rang":0.02700962871313095,"rights":0.09053926169872284,"electronic":0.20555634796619415,"table":0.7258259654045105,"##neck":0.23785334825515747,"stores":0.19389162957668304,"framework":0.06748900562524796,"##ent":0.011984942480921745,"stored":0.4392138123512268,"cite":0.2589486837387085,"php":0.1246982291340828,"movement":0.07024194300174713,"replica":0.3853139579296112,"scaled":0.2583388388156891,"##gre":0.006946501322090626,"use":0.05246197059750557,"autonomous":0.04779893904924393,"platforms":0.21232038736343384,"arrangement":0.11452334374189377,"ma":0.14236320555210114,"##gated":0.05919104442000389,"publication":0.26416337490081787,"links":0.1168990507721901,"##ix":0.04283112287521362,"read":0.11392813175916672,"author":0.005124954041093588,"lever":0.047128528356552124,"202":0.09494148939847946,"improve":0.19787470996379852,"oriented":0.005946191493421793,"harvard":0.12021857500076294,"collect":0.0367664135992527,"leverage":0.12915422022342682,"code":0.11764036118984222,"##rem":0.15288345515727997,"university":0.21453793346881866,"##ducted":0.05077028274536133,"nt":0.03587085381150246,"technique":0.25010690093040466,"storage":0.664306640625,"sql":0.30232128500938416,"effective":0.5217835903167725,"design":0.211115762591362,"department":0.1301238238811493,"or":0.10374488681554794,"unnecessary":0.21458150446414948,"##loading":0.053785763680934906,"application":0.13735057413578033,"##ls":0.0345272533595562,"strategy":0.2950744926929474,"##set":0.07817131280899048,"handles":0.07458522170782089,"authored":0.009289941750466824,"metadata":0.4663638174533844,"inform":0.0352148599922657,"java":0.05060293525457382,"identification":0.044286176562309265,"contribution":1.957742788363248E-4,"api":0.13799285888671875,"arrangements":0.09138143062591553,"publishing":0.16302029788494
11,"cache":0.11390167474746704,"adopt":0.03924081474542618,"##bbe":0.014609197154641151,"complexity":0.0326266773045063,"##cated":0.024558864533901215,"sud":0.32432225346565247,"document":0.03703418746590614,"之":0.08739982545375824,"##des":0.2296198159456253,"collecting":0.004397217649966478,"sd":0.5052663683891296,"permitted":0.33546653389930725,"si":0.27355116605758667,"managed":0.06154647096991539,"mit":0.6011233925819397,"dissertation":0.06632443517446518,"samuel":0.2350810468196869,"attribute":0.05271819978952408,"mechanism":0.02889232710003853,"##ded":0.13108870387077332,"email":0.06578194350004196,"scaling":0.17781731486320496,"consolidate":0.027436576783657074,"strategies":0.113438181579113,"##hema":0.23263543844223022,"##dicate":0.36283668875694275,"store":0.32825562357902527,"dept":0.1273798644542694,"evolve":0.3226865828037262,"##pr":0.260892391204834,"##spar":0.0070100268349051476,"ibm":0.18703199923038483,"##re":0.09589269012212753,"project":0.040024153888225555,"run":0.25628039240837097,"source":0.25433892011642456,"research":0.10116157680749893,"##21":0.023047372698783875,"apache":0.09287525713443756,"##19":0.29123806953430176,"dynamic":0.26993340253829956,"cambridge":0.06846900284290314,"##imi":0.2663104832172394,"ur":0.32422634959220886,"##erate":0.02519875578582287,"##sd":0.05668404698371887,"pre":0.029688265174627304,"oracle":0.1251661330461502,"query":0.40975427627563477,"adapt":0.12316759675741196,"engineering":0.2697928249835968,"duplicate":0.2036464512348175,"##table":0.22901959717273712,"164":0.020211847499012947,"technologies":0.04454812780022621,"opt":0.2722862958908081,"improving":0.01237229723483324,"spaces":0.13646428287029266,"citing":0.07494500279426575,"organise":0.17359448969364166,"correlated":0.15613079071044922,"que":0.04446617141366005,"memory":0.17828767001628876,"records":0.3434605598449707,"mass":0.29878172278404236,"##his":0.03521869331598282,"##hir":0.29539191722869873,"##dicated":0.10428228974342346,"linux":0.07176382839679
718,"effectively":0.16205783188343048,"technology":0.14704911410808563,"engineer":0.04916620999574661,"storing":0.38104721903800964,"layout":0.7799280881881714,"##45":0.05613727867603302,"1721":0.3745228350162506,"##46":0.03330061212182045,"what":0.06060778349637985,"relational":0.0040364651940763,"container":0.49311894178390503,"software":0.06534212827682495,"repository":0.06800449639558792,"##gen":0.06079591065645218,"optimization":0.31991299986839294,"het":0.31244707107543945,"##plication":0.045109134167432785,"enable":0.018832581117749214,"massachusetts":0.6343134641647339,"##va":0.2362612783908844,"azure":0.24342027306556702,"1735":0.20041684806346893,"##oud":0.3017263412475586,"method":0.11747122555971146,"##tech":0.021458473056554794,"##sing":0.07965080440044403,"rely":0.08859732002019882,"##vas":0.05118789151310921,"##alia":0.046114541590213776,"madden":0.39686474204063416,"methods":0.09474556148052216,"pattern":0.17698822915554047,"distribution":0.04538111761212349,"layer":0.5433851480484009,"##ign":0.14252465963363647,"specified":0.009819184429943562,"advisor":0.2219105064868927,"computer":0.2410481870174408,"modern":0.318084716796875,"web":0.06391556560993195,"copy":0.0919894352555275,"architecture":0.32910728454589844,"replication":0.49000170826911926,"##ifiers":0.06591592729091644,"efficient":0.006002710200846195,"organizes":0.2346716672182083,"evolving":0.4406088590621948,"##wat":0.03919680044054985,"organizer":0.0716496929526329,"organization":0.16292889416217804,"organized":0.2512205243110657,"self":0.5482035279273987,"##org":0.3067812919616699,"organizing":0.39903122186660767,"1648":0.4150104224681854,"queue":0.0555993877351284,"##lla":0.10509754717350006,"statistics":0.03485767915844917,"date":0.1782480776309967,"data":0.8925544619560242,"space":0.32082974910736084,"cloud":0.7172479629516602,"protocol":0.09842625260353088,"expressive":0.3634095788002014,"1653":0.041055675595998764,"1652":0.10437506437301636,"##code":0.05871046334505081,"publishers"
:0.03331702575087547,"##ze":0.1524764597415924,"tag":0.04246281832456589,"manually":0.2300417572259903,"offset":0.4211694002151489,"resource":0.2606988847255707,"kind":0.24382555484771729,"##pace":0.5771853923797607,"format":0.3028789758682251,"published":0.16174545884132385,"##pro":0.1615135371685028,"proposed":0.03647463023662567,"techniques":0.23815201222896576,"publisher":0.15755103528499603,"files":0.15452106297016144,"##duction":0.3013398051261902,"scala":0.15700779855251312,"instances":0.04008319228887558,"##zed":0.14709077775478363,"link":0.028665516525506973,"caf":0.4966190457344055,"scale":0.03247199207544327,"clouds":0.5771607756614685,"platform":0.28267577290534973,"##oop":0.17476539313793182,"aware":0.3204469084739685,"database":0.5004675984382629,"computing":0.25165945291519165,"##2":0.007380043156445026,"contributor":0.028220346197485924,"relies":0.019577080383896828,"organize":0.30881839990615845,"value":0.42455965280532837,"##gation":0.05702606961131096,"sam":0.026096927002072334,"inc":0.10717029869556427,"##ass":0.09972890466451645,"sap":0.08082880079746246,"cost":0.040225543081760406,"selective":0.31799954175949097,"##zation":0.0020445839036256075,"implementation":0.015150299295783043,"reads":0.25097641348838806,"##ash":0.005936117842793465,"resources":0.06681738048791885,"approaches":0.18937011063098907,"##asa":0.24941857159137726,"cloudy":0.07466921955347061,"performance":0.3397291302680969,"responsive":0.050710584968328476,"variable":0.07320675998926163,"independently":0.011299625970423222,"timothy":0.1863427311182022,"evolutionary":0.04480526223778725,"methodology":0.020644959062337875},"dates":[{"kind":"Publication date","value":"2025-09"}],"source":"DSpace@MIT","title":"Optimizing Data Layouts for Evolving Cloud Table Storage","source_link":"https://dspace.mit.edu/handle/1721.1/164819","content_type":["Thesis"],"rights":[{"description":"In Copyright - Educational Use 
Permitted","kind":"useAndReproduction"}],"publishers":[{"name":"Massachusetts Institute of Technology"}],"links":[{"url":"https://hdl.handle.net/1721.1/164819","kind":"Digital object URL","text":"Digital object URL"}],"contributors":[{"value":"Cafarella, Michael J.","kind":"advisor"},{"value":"Madden, Samuel R.","kind":"advisor"},{"value":"Sudhir, Sivaprasad","kind":"author"},{"value":"Massachusetts Institute of Technology. Department of Electrical Engineering and Computer Science","kind":"department"}],"timdex_record_id":"dspace:1721.1-164819"},"sort":[10.180051,1756684800000]},{"_index":"dspace-2026-02-09t19-23-02","_id":"dspace:1721.1-164767","_score":10.08786,"_source":{"summary":["Thanks to the advances in generative architectures and large language models, data scientists can now code pipelines of AI operations to process large collections of unstructured data. Recent progress has seen the rise of declarative AI frameworks (e.g., Palimpzest, Lotus, and DocETL) to build optimized and increasingly complex pipelines, but these systems often remain accessible only to expert programmers. In this demonstration, we present PalimpChat, a chat-based interface to Palimpzest that bridges this gap by letting users create and run sophisticated AI pipelines through natural language alone. By integrating Archytas, a ReAct-based reasoning agent, and Palimpzest's suite of relational and LLM-based operators, PalimpChat provides a practical illustration of how a chat interface can make declarative AI frameworks truly accessible to non-experts.\r\nOur demo system is publicly available online. At SIGMOD'25, participants can explore three real-world scenarios-scientific discovery, legal discovery, and real estate search-or apply PalimpChat to their own datasets. 
In this paper, we focus on how PalimpChat, supported by the Palimpzest optimizer, simplifies complex AI workflows such as extracting and analyzing biomedical data."],"timdex_provenance":{"source":"dspace","run_date":"2026-02-11","run_id":"c13f46c9-4a92-bb7e-b2cf-a85bae3c321c_59e5b3cf-7ebf-76f8-2407-94ea3ec591ed","run_record_offset":12},"languages":["en"],"citation":"Chunwei Liu, Gerardo Vitagliano, Brandon Rose, Matthew Printz, David Andrew Samson, and Michael Cafarella. 2025. PalimpChat: Declarative and Interactive AI analytics. In Companion of the 2025 International Conference on Management of Data (SIGMOD/PODS '25). Association for Computing Machinery, New York, NY, USA, 183–186.","file_formats":["application/pdf"],"identifiers":[{"value":"979-8-4007-1564-8","kind":"isbn"},{"value":"https://hdl.handle.net/1721.1/164767","kind":"uri"},{"value":"PUBLISHER_POLICY","kind":"mitlicense"}],"format":"electronic resource","embedding_full_record":{"dec":0.5954597592353821,"optimal":0.134453684091568,"objects":0.13916996121406555,"##i":0.10554685443639755,"##are":0.26956647634506226,"scenarios":0.14675582945346832,"##frame":0.05123161897063255,"##l":0.19386419653892517,"##m":0.2923606336116791,"analyzing":0.1156606450676918,"##q":0.06404843926429749,"##t":0.4171992242336273,"complex":0.26753705739974976,"record":0.21629448235034943,"##x":0.3090686798095703,"sci":0.09362266957759857,"##z":0.06291191279888153,"##ances":0.04329901933670044,"##pod":0.13230951130390167,"ac":0.3406832814216614,"#":0.037347178906202316,"ai":0.6726658940315247,"analysis":0.294997900724411,"5":0.11133122444152832,"science":0.1724609136581421,"domain":0.05292506143450737,"institute":0.26772886514663696,"object":0.2550002634525299,"@":0.10574298352003098,"accessible":0.433545857667923,"statistical":0.07632161676883698,"cited":0.23701176047325134,"proven":0.31021732091903687,"coding":0.21894946694374084,"search":0.16935589909553528,"citations":0.2843496799468994,"journal":0.03335770219564438,"systems":
0.11979752033948898,"vita":0.3417627513408661,"##zing":0.034766051918268204,"##flow":0.29700782895088196,"huang":0.009352168068289757,"computers":0.08163406699895859,"policy":0.13479433953762054,"_":0.09925118833780289,"d":0.048542317003011703,"r":0.011955215595662594,"information":0.06478222459554672,"arch":0.5317913293838501,"##ance":0.31939050555229187,"analytic":0.29517000913619995,"publications":9.766384755494073E-5,"##as":0.31896665692329407,"##met":0.011232072487473488,"##mer":0.12373972684144974,"##and":0.06540070474147797,"language":0.5579164028167725,"developed":0.041048355400562286,"robotic":0.048586949706077576,"ds":0.5457614660263062,"analytics":0.48855459690093994,"chinese":0.10345775634050369,"gong":0.033982738852500916,"samson":0.21348853409290314,"legal":0.30751746892929077,"tim":0.49699676036834717,"##bot":0.08093805611133575,"programming":0.2231278270483017,"conversation":0.14458097517490387,"computational":0.1415461152791977,"searches":0.03405192494392395,"turing":0.03330662474036217,"publicly":0.07334821671247482,"##anal":0.007858592085540295,"andrew":0.2399948090314865,"users":0.2386600226163864,"article":0.13753482699394226,"chu":0.009590883739292622,"labs":0.02303052321076393,"##ali":0.18210850656032562,"##lar":0.28971996903419495,"formats":0.22985851764678955,"analytical":0.18402650952339172,"companion":0.42733386158943176,"##glia":0.18256431818008423,"interface":0.43063464760780334,"content":0.22030377388000488,"symposium":0.0934908464550972,"##lab":0.09397801011800766,"##ch":0.026198524981737137,"engine":0.008886734023690224,"authorship":0.12724699079990387,"sim":0.11042779684066772,"##con":0.009827906265854836,"##com":0.035595327615737915,"digital":0.34351661801338196,"practical":0.20203423500061035,"##mbo":0.07753720134496689,"citation":0.3653000295162201,"message":0.12819385528564453,"michael":0.16396722197532654,"##de":0.4860161542892456,"print":0.2819647789001465,"pdf":0.27501189708709717,"management":0.3871690332889557,"2015":0.03595
445305109024,"coffee":0.1830432415008545,"publish":0.11892998963594437,"analyst":0.14669854938983917,"developer":0.018960915505886078,"contributors":0.13979411125183105,"hd":0.08719979971647263,"expert":0.3016442060470581,"copyright":0.13065338134765625,"advanced":0.09304313361644745,"bio":0.05869514122605324,"zhang":0.13505667448043823,"##ifies":0.13492554426193237,"##ifier":0.08892931044101715,"advances":0.17074204981327057,"model":0.1690206229686737,"ic":0.008817754685878754,"id":0.3341974914073944,"text":0.03729218244552612,"flow":0.15848687291145325,"##et":0.3442857265472412,"algorithm":0.09601767361164093,"##ods":0.15730684995651245,"python":0.04934883490204811,"large":0.05192487686872482,"programmer":0.10488651692867279,"handle":0.1578153669834137,"script":0.06321126967668533,"intelligence":0.4469160735607147,"messaging":0.21617400646209717,"system":0.22288846969604492,"anal":0.027875926345586777,"analyze":0.08985153585672379,"integration":0.1768156737089157,"doc":0.346474826335907,"messages":0.09190214425325394,"machinery":0.1864054948091507,"authors":0.09388116002082825,"algorithms":0.20159579813480377,"semantic":0.08245482295751572,"server":0.046397119760513306,"file":0.260295033454895,"legally":0.03997879475355148,"##gm":0.3139878809452057,"rights":0.13036134839057922,"electronic":0.17988044023513794,"share":0.0691070631146431,"agents":0.12257324159145355,"framework":0.5020638108253479,"##ent":0.039861466735601425,"messenger":0.03087647445499897,"discovery":0.3118858337402344,"machine":0.13117191195487976,"cite":0.30944591760635376,"php":0.0609348826110363,"rose":0.11632362008094788,"logic":0.14972247183322906,"ll":0.42618852853775024,"genera":0.40238672494888306,"codes":0.01576380431652069,"##ive":0.06803474575281143,"use":0.019859859719872475,"autonomous":0.08108963817358017,"shen":0.013750644400715828,"lab":0.08225709199905396,"chun":0.3402756452560425,"hacking":0.05528758093714714,"automation":0.11218701303005219,"ma":0.01654357649385929,"publication"
:0.3209046721458435,"##tive":0.18090465664863586,"links":0.09170857071876526,"international":0.39598584175109863,"##ix":0.0060868775472044945,"matthew":0.17196431756019592,"mp":0.05403964966535568,"author":0.18715205788612366,"estate":0.16160795092582703,"applicable":0.03518630564212799,"##ke":0.03282433748245239,"real":0.020910346880555153,"tool":0.11538107693195343,"coded":0.0852227658033371,"license":0.029781823977828026,"202":0.3740224540233612,"simplified":0.19532614946365356,"scientists":0.2706853151321411,"harvard":0.07442791759967804,"##cha":0.5567348003387451,"code":0.29890283942222595,"university":0.11709660291671753,"bot":0.08870883285999298,"ny":0.04755084216594696,"demo":0.3904772102832794,"sql":0.1337837129831314,"##ma":0.011629858054220676,"##mb":0.09094563871622086,"##mc":0.0741843655705452,"##me":0.033737149089574814,"intelligent":0.1790977120399475,"##ml":0.02497350051999092,"application":0.16276700794696808,"##ls":0.06648015230894089,"online":0.018298696726560593,"machines":0.07244321703910828,"##set":0.24582719802856445,"authored":0.11759733408689499,"inform":0.012436202727258205,"expertise":0.14155475795269012,"##mo":0.05500169098377228,"lambda":0.018720852211117744,"##mp":0.5209788084030151,"java":0.14465363323688507,"contribution":0.09299298375844955,"##mt":0.10682643204927444,"programmers":0.20643799006938934,"api":0.22489520907402039,"publishing":0.23265480995178223,"recent":0.00533339474350214,"based":0.35087138414382935,"models":0.10920455306768417,"##od":0.30725428462028503,"##no":0.07732182741165161,"processing":0.2057042270898819,"demonstration":0.2758650779724121,"##ructured":0.10543014854192734,"complexity":0.05499844625592232,"sophisticated":0.3168146014213562,"conference":0.5271146893501282,"access":0.24768197536468506,"25":0.19571137428283691,"pod":0.3803131580352783,"document":0.08505140244960785,"association":0.25894787907600403,"##des":0.13781383633613586,"##pl":0.12754309177398682,"arc":0.027421122416853905,"scenario":0.0253076
60922408104,"si":0.34429246187210083,"mit":0.5564423203468323,"u2":0.025754446163773537,"conferences":0.1558762937784195,"email":0.04601770266890526,"participants":0.14264541864395142,"languages":0.3048386871814728,"dept":0.003600765485316515,"biomedical":0.3553627133369446,"##pp":0.02900342456996441,"##01":0.1607198864221573,"automated":0.03295006975531578,"ibm":0.1677124798297882,"##tream":0.06785175204277039,"progress":0.19664683938026428,"experts":0.1724136769771576,"chart":0.021671980619430542,"supported":0.26801827549934387,"agent":0.21048584580421448,"medical":0.003981953486800194,"##re":0.04916198551654816,"##tch":0.034589752554893494,"available":0.23970697820186615,"run":0.3043859601020813,"source":0.2121095359325409,"operator":0.2842370569705963,"participant":0.024803435429930687,"##21":0.022972777485847473,"apache":0.005948654375970364,"ui":0.12666082382202148,"liu":0.3619098961353302,"un":0.08916070312261581,"cambridge":0.0794227123260498,"##imi":0.18746007978916168,"ur":0.3109990358352661,"oracle":0.08491761237382889,"query":0.05588340014219284,"collection":0.22929976880550385,"bridges":0.042909666895866394,"##sp":0.04726104810833931,"164":0.477152019739151,"##32":0.03595387190580368,"technologies":0.03787704184651375,"opt":0.14535875618457794,"extract":0.20620572566986084,"reactive":0.19044195115566254,"##25":0.07246998697519302,"laboratory":0.09087370336055756,"spaces":0.041228532791137695,"citing":0.10804896801710129,"demonstrate":0.14692117273807526,"support":0.025300128385424614,"analysts":0.010002309456467628,"records":0.13014982640743256,"scientist":0.22790828347206116,"isbn":0.17634262144565582,"mass":0.010078338906168938,"##tp":0.09383145719766617,"172":0.04603071138262749,"non":0.015877271071076393,"##ts":0.038973964750766754,"1712":0.026136890053749084,"##st":0.02617635950446129,"##zers":0.07181835174560547,"1717":0.058430854231119156,"1716":0.01737270876765251,"convention":0.08478158712387085,"interfaces":0.21349747478961945,"technology":0.0
7740594446659088,"183":0.17157115042209625,"##tt":0.08867605030536652,"1722":0.11753850430250168,"artificial":0.5480661392211914,"1721":0.41380810737609863,"##46":0.2297029346227646,"##47":0.0012416308745741844,"##pods":0.1101800799369812,"pods":0.5331591963768005,"relational":0.2555985152721405,"applications":0.015597726218402386,"software":0.23809322714805603,"funnel":0.16190598905086517,"##wei":0.25616028904914856,"reasoning":0.3137255311012268,"interactive":0.5757089853286743,"react":0.44707754254341125,"##59":0.036365121603012085,"collections":0.26848623156547546,"optimization":0.178436279296875,"massachusetts":0.43132758140563965,"pali":0.6572268009185791,"##nse":0.061576250940561295,"natural":0.23734675347805023,"method":0.011352050118148327,"##lice":0.1568196415901184,"##tech":0.04942794889211655,"extraction":0.14612892270088196,"##mps":0.35018131136894226,"demos":0.35194098949432373,"methods":0.03140057250857353,"tools":0.09678442776203156,"##85":0.07395543158054352,"commons":0.28012728691101074,"##86":0.1035836786031723,"computer":0.26683780550956726,"operators":0.31635692715644836,"web":0.035767264664173126,"demonstrated":0.0859009250998497,"architecture":0.25793376564979553,"##bution":0.005822801496833563,"##ifiers":0.05906414985656738,"##yt":0.35118788480758667,"pipeline":0.5732517242431641,"chat":0.5982276201248169,"yong":0.1006295382976532,"chan":0.062144190073013306,"queue":0.10439760237932205,"##lla":0.15081161260604858,"statistics":0.016990603879094124,"date":0.1968129277229309,"##ifying":0.05481274053454399,"data":0.6942856907844543,"##kit":0.13248278200626373,"lotus":0.41086724400520325,"space":0.22925597429275513,"cloud":0.026967184618115425,"protocol":0.10797980427742004,"brandon":0.3680271804332733,"##code":0.09118317812681198,"publishers":0.14358286559581757,"create":0.11449751257896423,"##ze":0.044128142297267914,"tag":0.017904384061694145,"offset":0.38137492537498474,"##ative":0.3410850167274475,"resource":0.26426202058792114,"kind":0.26887
238025665283,"##pace":0.5417245030403137,"format":0.2596947252750397,"published":0.27859288454055786,"mining":0.0017629729118198156,"##pro":0.24356117844581604,"##zes":0.419977605342865,"publisher":0.2578429877758026,"##zer":0.1413974016904831,"files":0.0785248875617981,"managing":0.10123620182275772,"##duction":0.29547420144081116,"scala":0.0892665758728981,"scientific":0.2104766070842743,"##zed":0.15271644294261932,"link":0.04365725815296173,"caf":0.5194419026374817,"interact":0.04496682435274124,"conversations":0.20722037553787231,"platform":0.1088116466999054,"##oop":0.020076099783182144,"integrated":0.15415960550308228,"##ference":0.06558230519294739,"computing":0.3104116916656494,"database":0.2472817599773407,"operations":0.2490500658750534,"contributor":0.07452178746461868,"paper":0.060500118881464005,"##5":0.46795183420181274,"##7":0.15998373925685883,"##9":0.0018509585643187165,"david":0.1052115187048912,"value":0.4929240643978119,"##ass":0.02636086940765381,"chen":0.0362897552549839,"process":0.10015250742435455,"implementation":0.05677249655127525,"resources":0.13578371703624725,"york":0.22204461693763733,"##mble":0.06305328011512756,"gerard":0.2740379273891449,"interaction":0.10071361809968948,"cheng":0.1099993884563446,"user":0.16757832467556,"chatting":0.07477272301912308,"timothy":0.0661427304148674,"methodology":0.06377092003822327},"dates":[{"kind":"Publication date","value":"2025-06-22"}],"source":"DSpace@MIT","title":"PalimpChat: Declarative and Interactive AI analytics","source_link":"https://dspace.mit.edu/handle/1721.1/164767","content_type":["Article"],"rights":[{"description":"Creative Commons Attribution-Noncommercial-ShareAlike","kind":"useAndReproduction"}],"publishers":[{"name":"ACM|Companion of the 2025 International Conference on Management of Data"}],"links":[{"url":"https://hdl.handle.net/1721.1/164767","kind":"Digital object URL","text":"Digital object URL"}],"contributors":[{"value":"Liu, 
Chunwei","kind":"author"},{"value":"Vitagliano, Gerardo","kind":"author"},{"value":"Rose, Brandon","kind":"author"},{"value":"Printz, Matthew","kind":"author"},{"value":"Samson, David Andrew","kind":"author"},{"value":"Cafarella, Michael","kind":"author"},{"value":"Massachusetts Institute of Technology. Computer Science and Artificial Intelligence Laboratory","kind":"department"}],"timdex_record_id":"dspace:1721.1-164767"},"sort":[10.08786,1750550400000]},{"_index":"dspace-2026-02-09t19-23-02","_id":"dspace:1721.1-154072","_score":9.972086,"_source":{"summary":["Timeseries analytics is important in many real-world applications. Recently, the Transformer model, popular in natural language processing, has been leveraged to learn high quality feature embeddings from timeseries: embeddings are key to the performance of various timeseries analytics tasks such as similarity-based timeseries queries within vector databases. However, quadratic time and space complexities limit Transformers' scalability, especially for long timeseries. To address these issues, we develop a timeseries analytics tool, RITA, which uses a novel attention mechanism, named group attention, to address this scalability issue. Group attention dynamically clusters the objects based on their similarity into a small number of groups and approximately computes the attention at the coarse group granularity. It thus significantly reduces the time and space complexity, yet provides a theoretical guarantee on the quality of the computed attention. The dynamic scheduler of RITA continuously adapts the number of groups and the batch size in the training process, ensuring group attention always uses the fewest groups needed to meet the approximation quality requirement. 
Extensive experiments on various timeseries datasets and analytics tasks demonstrate that RITA outperforms the state-of-the-art in accuracy and is significantly faster --- with speedups of up to 63X."],"timdex_provenance":{"source":"dspace","run_date":"2026-04-15","run_id":"a816f3dc-51ac-7e5f-cec8-1086ffc54274_861de409-c771-2e2c-c416-93c81a0885e3","run_record_offset":866},"languages":["en"],"citation":"Jiaming Liang, Lei Cao, Samuel Madden, Zachary Ives, and Guoliang Li. 2024. RITA: Group Attention is All You\r\nNeed for Timeseries Analytics. Proc. ACM Manag. Data 2, 1 (SIGMOD), Article 62 (February 2024), 28 pages.","file_formats":["application/pdf"],"identifiers":[{"value":"2836-6573","kind":"issn"},{"value":"https://hdl.handle.net/1721.1/154072","kind":"uri"},{"value":"PUBLISHER_CC","kind":"mitlicense"}],"format":"electronic resource","embedding_full_record":{"authored":0.06250414252281189,"cluster":0.3495125472545624,"accurate":0.3165164589881897,"objects":0.2874133288860321,"accuracy":0.40411248803138733,"##i":0.0206555537879467,"##frame":0.10140614956617355,"##m":0.4147489070892334,"analyzing":0.01956622302532196,"##q":0.16737623512744904,"lei":0.14526407420635223,"##r":0.2237011343240738,"dynamics":0.16136816143989563,"lambda":0.04746478050947189,"java":0.11454816907644272,"contribution":0.041250698268413544,"stats":0.062352120876312256,"##ibility":0.03597671166062355,"##ms":0.09958906471729279,"record":0.22096696496009827,"complex":0.19355466961860657,"##ancy":0.01587717793881893,"##x":0.22792062163352966,"sci":0.049521367996931076,"##ances":0.06314469128847122,"api":0.037162624299526215,"publishing":0.18743592500686646,"temporal":0.016084695234894753,"limitations":0.09740409255027771,"databases":0.16235794126987457,"based":0.14621146023273468,"models":0.131923645734787,"ac":0.5911601781845093,"grouped":0.19910621643066406,"#":0.06761182844638824,"##od":0.21180392801761627,"ai":0.2912802994251251,"analysis":0.4090780019760132,"processor":0.017450818791985512
,"quality":0.4198233187198639,"node":0.13251769542694092,"science":0.15685991942882538,"##ratic":0.1415540724992752,"domain":0.06314707547426224,"processing":0.2763349413871765,"institute":0.2266305536031723,"agile":0.08163060247898102,"jiang":0.010900731198489666,"object":0.27523937821388245,"@":0.10217314213514328,"complexity":0.3342492878437042,"statistical":0.24916952848434448,"experiments":0.19510310888290405,"association":0.15871058404445648,"cited":0.15624725818634033,"proven":0.3052966892719269,"##des":0.17730998992919922,"##iling":0.07319483160972595,"adaptive":0.05641819164156914,"##eries":0.4600696563720703,"citations":0.2505398690700531,"journal":0.07588277757167816,"si":0.28196921944618225,"mit":0.6213510632514954,"##ries":0.030553609132766724,"samuel":0.3895134925842285,"vector":0.37891143560409546,"attribute":0.023838788270950317,"mechanism":0.33444035053253174,"embedded":0.16522248089313507,"##ities":0.09591478854417801,"huang":0.010517638176679611,"##ded":0.004028679803013802,"limits":0.1151745468378067,"email":0.10995126515626907,"computers":0.10220826417207718,"key":0.03652484714984894,"_":0.11431582272052765,"cc":0.05286381393671036,"ce":0.031241867691278458,"scaling":0.018879886716604233,"languages":0.21441806852817535,"learn":0.008196902461349964,"fastest":0.29466512799263,"ming":0.03537623584270477,"gran":0.24730561673641205,"dept":0.0562407448887825,"q":0.01297533418983221,"similarities":0.3003213405609131,"r":0.020216794684529305,"fast":0.21161267161369324,"mana":0.14568200707435608,"ibm":0.1285751760005951,"metric":0.0805630311369896,"series":0.295034795999527,"##ance":0.34226226806640625,"analytic":0.30908340215682983,"novel":0.23361320793628693,"db":0.17235039174556732,"publications":0.010597790591418743,"calculation":0.03736814484000206,"approximate":0.2184886336326599,"##oza":0.028477225452661514,"project":0.00811498798429966,"language":0.34823083877563477,"run":0.14940738677978516,"##ding":0.2321685403585434,"source":0.2267866879701614
4,"developed":0.042273182421922684,"##ally":0.030514847487211227,"research":0.01528649590909481,"ds":0.5832194685935974,"##21":0.009358201175928116,"analytics":0.5393105149269104,"compute":0.08364332467317581,"chinese":0.15017886459827423,"##16":0.12506794929504395,"scheduling":0.33843177556991577,"tim":0.5090839266777039,"dynamic":0.5430446863174438,"cambridge":0.026996610686182976,"ur":0.24381211400032043,"##ao":0.01985800266265869,"computational":0.11111067235469818,"oracle":0.10116423666477203,"need":0.13346397876739502,"query":0.3319386839866638,"batch":0.4581168293952942,"em":0.33100077509880066,"ives":0.4862979054450989,"281":0.16818612813949585,"pro":0.18419373035430908,"##anal":0.053302157670259476,"encoding":0.048612311482429504,"283":0.3146224617958069,"##table":0.1278245896100998,"article":0.13826727867126465,"284":0.0848110169172287,"286":0.09911919385194778,"##rs":0.06386101990938187,"laboratory":0.11142909526824951,"##ular":0.10169627517461777,"sparse":0.05134239420294762,"spaces":0.03653572499752045,"citing":0.023297984153032303,"62":0.033033207058906555,"useful":0.026025790721178055,"que":0.14146919548511505,"analysts":0.10471880435943604,"formats":0.14095844328403473,"analytical":0.2212863713502884,"records":0.17034438252449036,"scheduled":0.26890766620635986,"needed":0.05326158180832863,"importance":0.053058359771966934,"mass":0.10226316004991531,"training":0.3200605809688568,"aggregation":0.10368151217699051,"##forms":0.07589272409677505,"speed":0.23687078058719635,"content":0.20689283311367035,"##nee":0.2101256251335144,"rita":0.8143132925033569,"##lab":0.10486173629760742,"similarity":0.49430525302886963,"authorship":0.13957995176315308,"schedules":0.13928920030593872,"linux":0.055038005113601685,"1717":0.032059162855148315,"clusters":0.3174743354320526,"digital":0.2832144796848297,"citation":0.3287360966205597,"perform":0.0426170751452446,"technology":0.03959401324391365,"##time":0.09806318581104279,"##de":0.4324119985103607,"schedule":0.38062
25061416626,"1722":0.008126760832965374,"1721":0.40576377511024475,"artificial":0.36693042516708374,"##ery":0.12244746088981628,"pdf":0.26239851117134094,"what":0.019376078620553017,"china":0.037311624735593796,"regression":0.07888711988925934,"publish":0.0869990736246109,"##inator":0.010005771182477474,"analyst":0.2311987727880478,"time":1.0289815664291382,"contributors":0.06709376722574234,"xu":0.01828502118587494,"86":0.1597411185503006,"applications":0.16427397727966309,"copyright":0.03596006706357002,"jia":0.2096569687128067,"modeling":0.09351407736539841,"software":0.2651221454143524,"##ble":0.16242289543151855,"experimental":0.06705167144536972,"zhang":0.08915107697248459,"processors":0.0030856637749820948,"number":0.08318009227514267,"##ifier":0.08722248673439026,"##lian":0.2367670089006424,"experiment":0.012016255408525467,"massachusetts":0.45711034536361694,"model":0.35854047536849976,"id":0.2733488380908966,"proceedings":0.23006024956703186,"##er":0.18789052963256836,"liang":0.3082938492298126,"tasks":0.0965961292386055,"##nse":0.01624121144413948,"hunan":0.006701237987726927,"algorithm":0.21224406361579895,"##ods":0.17049872875213623,"reduce":0.13997238874435425,"similar":0.38145825266838074,"transformers":0.520793080329895,"python":0.002388768596574664,"natural":0.18719765543937683,"method":0.06968694180250168,"##lice":0.057775333523750305,"handle":0.11303234100341797,"grouping":0.10614132881164551,"intel":0.023486312478780746,"script":0.03678879141807556,"creative":0.02230140194296837,"intelligence":0.32734909653663635,"##sing":0.03468881919980049,"issn":0.29554906487464905,"anal":0.08510633558034897,"analyze":0.17685604095458984,"madden":0.42901378870010376,"hash":0.01419819239526987,"machinery":0.14156962931156158,"authors":0.07760780304670334,"##erie":0.019393229857087135,"ji":0.009977735579013824,"guo":0.3011418282985687,"algorithms":0.17265206575393677,"server":0.10840509831905365,"##per":0.14023108780384064,"computed":0.2838497459888458,"methods"
:0.0018763651605695486,"1086":0.04168575257062912,"tools":0.3211768865585327,"commons":0.20641188323497772,"computer":0.26961567997932434,"file":0.23983904719352722,"feature":0.20827408134937286,"##gm":0.28849542140960693,"electronic":0.16337870061397552,"##ifiers":0.052070364356040955,"clustered":0.3315786123275757,"transformation":0.22148822247982025,"##ming":0.2053191363811493,"computation":0.059317439794540405,"fraction":0.020799869671463966,"quad":0.02236507274210453,"framework":0.06180252879858017,"##ent":0.009141631424427032,"machine":0.10105223953723907,"yong":0.06722568720579147,"cite":0.2748035192489624,"php":0.0894031897187233,"li":0.2729487419128418,"queue":0.12690459191799164,"statistics":0.2719656825065613,"date":0.18876324594020844,"data":0.5285845398902893,"theoretical":0.0708773136138916,"scaled":0.019312994554638863,"use":0.03121419996023178,"precision":0.00330102676525712,"transforms":0.0877813920378685,"integer":0.017946965992450714,"used":0.003457715269178152,"lab":0.08697095513343811,"space":0.2475978583097458,"##bility":0.262219101190567,"faster":0.30351680517196655,"pages":0.12208819389343262,"automation":0.0404137447476387,"ma":0.0330902598798275,"coarse":0.423259973526001,"publication":0.31155064702033997,"limit":0.17905783653259277,"host":0.13868455588817596,"publishers":0.08175834268331528,"links":0.030996542423963547,"tag":0.04301407188177109,"mechanisms":0.15385998785495758,"calculated":0.08702979981899261,"group":0.8860188722610474,"##ix":0.014491083100438118,"all":0.03328382968902588,"approximation":0.3126513659954071,"offset":0.3984887897968292,"resource":0.23692965507507324,"kind":0.17658595740795135,"author":0.1566951423883438,"##pace":0.48780226707458496,"format":0.23283644020557404,"cpu":0.03108060546219349,"published":0.2444043755531311,"lever":0.02239195629954338,"tool":0.4331250786781311,"##ity":0.17846646904945374,"important":0.15687747299671173,"sequence":0.054030273109674454,"vectors":0.10603637993335724,"##pro":0.205197080
96981049,"task":0.18777167797088623,"202":0.10256083309650421,"1540":0.25140076875686646,"publisher":0.23968227207660675,"files":0.057460103183984756,"harvard":0.017889821901917458,"leverage":0.12450428307056427,"limitation":0.0906817838549614,"code":0.1487729251384735,"ling":0.02543904259800911,"scala":0.5106821060180664,"##duction":0.3057882785797119,"university":0.0628678947687149,"link":0.0021837931126356125,"##oop":0.09841788560152054,"platform":0.00939986016601324,"sql":0.2283647060394287,"aggregate":0.05906238406896591,"cao":0.3018849492073059,"times":0.8698575496673584,"transform":0.393524706363678,"database":0.38857758045196533,"computing":0.28701451420783997,"contributor":0.04325903207063675,"##4":0.030926279723644257,"array":0.021531732752919197,"department":0.04395014047622681,"value":0.46844154596328735,"sam":0.1434582620859146,"##bed":0.19366015493869781,"##ass":0.02482995018362999,"chen":0.041453514248132706,"process":0.07493870705366135,"sap":0.070747010409832,"qing":0.08823900669813156,"limited":0.060234684497117996,"groups":0.40332743525505066,"resources":0.07301589101552963,"performance":0.2596159279346466,"application":0.20166657865047455,"zach":0.12970992922782898,"zack":0.3764365315437317,"variable":0.09021075814962387,"attention":0.9343430995941162,"##set":0.26578354835510254,"timothy":0.09520494937896729,"zachary":0.3683413863182068,"##ser":0.17104506492614746},"dates":[{"kind":"Publication date","value":"2024-03-12"}],"source":"DSpace@MIT","title":"RITA: Group Attention is All You Need for Timeseries Analytics","related_items":[{"description":"Proceedings of the ACM on Management of Data","relationship":"host"}],"source_link":"https://dspace.mit.edu/handle/1721.1/154072","content_type":["Article"],"rights":[{"description":"Creative Commons Attribution","kind":"useAndReproduction"}],"publishers":[{"name":"Association for Computing Machinery (ACM)"}],"links":[{"url":"https://hdl.handle.net/1721.1/154072","kind":"Digital object 
URL","text":"Digital object URL"}],"contributors":[{"value":"Liang, Jiaming","kind":"author"},{"value":"Cao, Lei","kind":"author"},{"value":"Madden, Samuel","kind":"author"},{"value":"Ives, Zack","kind":"author"},{"value":"Li, Guoliang","kind":"author"},{"value":"Massachusetts Institute of Technology. Computer Science and Artificial Intelligence Laboratory","kind":"department"}],"timdex_record_id":"dspace:1721.1-154072"},"sort":[9.972086,1710201600000]},{"_index":"dspace-2026-02-09t19-23-02","_id":"dspace:1721.1-158189","_score":9.902208,"_source":{"summary":["Games have become one of the most popular mediums across cultures and ages and the use of educational games is growing. There is ample evidence that supports the benefits of using games for learning and assessment. However, we do not usually find games incorporated into educational environments. One of the main problems that teachers face is to actually know how students are interacting with the game as they cannot analyze properly the effect of the activity on the students. To improve this issue, we can use the data generated by the interaction of students with such educational games to analyze the sequences and errors by transforming raw data into meaningful sequences that are interpretable and actionable for teachers. In this study we use a data collection from our game Shadowspect and implement learning analytics with process and sequence mining techniques to generate two metrics that aim to help teachers make proper assessment and better understand the process."],"timdex_provenance":{"source":"dspace","run_date":"2026-04-15","run_id":"a816f3dc-51ac-7e5f-cec8-1086ffc54274_861de409-c771-2e2c-c416-93c81a0885e3","run_record_offset":544},"languages":["en"],"citation":"Games have become one of the most popular mediums across cultures and ages and the use of educational games is growing. There is ample evidence that supports the benefits of using games for learning and assessment. 
However, we do not usually find games incorporated into educational environments. One of the main problems that teachers face is to actually know how students are interacting with the game as they cannot analyze properly the effect of the activity on the students. To improve this issue, we can use the data generated by the interaction of students with such educational games to analyze the sequences and errors by transforming raw data into meaningful sequences that are interpretable and actionable for teachers. In this study we use a data collection from our game Shadowspect and implement learning analytics with process and sequence mining techniques to generate two metrics that aim to help teachers make proper assessment and better understand the process.","file_formats":["application/pdf"],"identifiers":[{"value":"978-1-4503-8850-4","kind":"isbn"},{"value":"https://hdl.handle.net/1721.1/158189","kind":"uri"},{"value":"PUBLISHER_POLICY","kind":"mitlicense"}],"format":"electronic resource","embedding_full_record":{"authored":0.11171484738588333,"inform":0.07255442440509796,"interpreting":0.03647453337907791,"ps":0.005929179489612579,"objects":0.02500423789024353,"##i":0.0611104853451252,"##m":0.2903828024864197,"sequencing":0.4348330497741699,"objective":0.03336489945650101,"analyzing":0.3499673902988434,"evaluation":0.20522257685661316,"properly":0.1459272801876068,"identification":0.033479999750852585,"contribution":0.01887861080467701,"stats":0.09306534379720688,"retrieval":0.01181097887456417,"##ancy":0.010136660188436508,"##x":0.2269906997680664,"understanding":0.10651076585054398,"##ances":0.30549976229667664,"publishing":0.32336902618408203,"knowledge":0.018540158867836,"ac":0.39276131987571716,"using":0.2763674557209015,"gomez":0.31379804015159607,"impact":0.0938810482621193,"raw":0.3753768503665924,"analysis":0.3560086488723755,"benefit":0.43210986256599426,"miners":0.337857186794281,"exam":0.17718879878520966,"cultural":0.05665942281484604,"cognitive":0.088
11827749013901,"interpretation":0.07180982083082199,"domain":0.1549099236726761,"processing":0.07420726120471954,"institute":0.29838353395462036,"educators":0.39247798919677734,"multicultural":0.10444344580173492,"object":0.23282763361930847,"lessons":0.11944762617349625,"mined":0.4275180399417877,"statistical":0.23687191307544708,"ru":0.29161062836647034,"conference":0.2543249726295471,"nintendo":0.10666655749082565,"activity":0.3405604362487793,"##pe":0.46233099699020386,"experiments":0.021003874018788338,"students":0.5349224805831909,"instructional":0.4845876693725586,"cited":0.22560502588748932,"proven":0.34145405888557434,"collecting":0.16747687757015228,"miner":0.3386409282684326,"##iling":0.11102477461099625,"into":0.06351584941148758,"citations":0.2935464382171631,"journal":0.1311558336019516,"are":0.05458195134997368,"does":0.01850234903395176,"popularity":0.12677578628063202,"mit":0.5141494870185852,"supports":0.046547017991542816,"[":0.06649395823478699,"campos":0.07785928249359131,"popular":0.31602704524993896,"embedded":0.17472168803215027,"policy":0.3020879030227661,"_":0.02083037793636322,"mine":0.43471288681030273,"quiz":0.04192153736948967,"ce":0.11771376430988312,"languages":0.12573130428791046,"learn":0.4235273003578186,"analyzed":0.007118157111108303,"dept":0.08346915990114212,"##able":0.11120790243148804,"simulations":0.19189123809337616,"advantages":0.20628879964351654,"pearson":0.13936747610569,"taught":0.05461912974715233,"metric":0.39921075105667114,"##ance":0.3666025996208191,"technological":0.18885508179664612,"##ing":0.039647892117500305,"analytic":0.14932315051555634,"supported":0.11522067338228226,"publications":0.01442677155137062,"incorporation":0.2431659698486328,"##re":0.07139471918344498,"evidence":0.4173656404018402,"questions":0.011319471523165703,"##and":0.07902032136917114,"language":0.21432532370090485,"run":0.18819546699523926,"source":0.31541597843170166,"incorporate":0.16894882917404175,"do":0.11114909499883652,"graphics":0
.062409888952970505,"research":0.30500859022140503,"ds":0.533031702041626,"meaningful":0.4361054301261902,"instructors":0.16356335580348969,"analytics":0.43179941177368164,"assessment":0.5538440346717834,"afforded":0.13461272418498993,"158":0.3199150860309601,"school":0.49720025062561035,"##16":0.2162417471408844,"generated":0.14735518395900726,"incorporated":0.35746535658836365,"##18":0.12306170910596848,"##19":0.05840113013982773,"legal":0.03789589926600456,"tim":0.47694188356399536,"implement":0.1943490356206894,"cambridge":0.048772480338811874,"helpful":0.08717194944620132,"ict":0.03267231211066246,"ur":0.23801246285438538,"generate":0.20354785025119781,"ed":0.31153371930122375,"disadvantage":0.0028321880381554365,"##point":0.001673375372774899,"educational":0.78932785987854,"studying":0.03401067107915878,"chess":0.02548692561686039,"test":0.059046849608421326,"widely":0.07516292482614517,"shade":0.13138581812381744,"©":0.12972545623779297,"collection":0.30679118633270264,"8th":0.1198163628578186,"article":0.24797941744327545,"wiley":0.02149645984172821,"mines":0.3922884464263916,"improving":0.04162115603685379,"##27":0.011645765043795109,"beneficial":0.29368293285369873,"cultures":0.15930457413196564,"citing":0.09027329832315445,"playing":0.011787965893745422,"support":0.26477447152137756,"useful":0.22321324050426483,"gameplay":0.19145962595939636,"benefits":0.5389761328697205,"##ct":0.23562310636043549,"formats":0.12598708271980286,"analytical":0.2349443882703781,"sources":0.08444824069738388,"sequential":0.2814575731754303,"importance":0.09424101561307907,"isbn":0.26628321409225464,"mass":0.07872864603996277,"for":0.10822021216154099,"edition":0.043491512537002563,"proper":0.001231851987540722,"learning":0.6880468726158142,"generating":0.14192336797714233,"training":0.04012330248951912,"medium":0.41289234161376953,"video":0.14952534437179565,"##uca":0.30218377709388733,"content":0.3093835711479187,"random":0.09319355338811874,"psychology":0.10861583054065704,
"sourced":0.06421579420566559,"teachers":0.6787165999412537,"authorship":0.07434213161468506,"978":0.28119874000549316,"incorporating":0.10835997760295868,"digital":0.3075924217700958,"enhancing":0.030547121539711952,"summary":0.026079442352056503,"citation":0.3735676109790802,"teach":0.28874754905700684,"##media":0.061361148953437805,"reading":0.08759767562150955,"technology":0.12232235074043274,"##51":0.006331366952508688,"better":0.0582471564412117,"##de":0.40035462379455566,"1721":0.2831958532333374,"environment":0.26946184039115906,"pdf":0.31581032276153564,"interpret":0.2955525815486908,"publish":0.17918218672275543,"analyst":0.1250784695148468,"contributors":0.09657818078994751,"hd":0.008604977279901505,"86":0.01000616792589426,"college":0.050413504242897034,"play":0.01875738613307476,"copyright":0.5497828125953674,"education":0.7968348860740662,"shadow":0.4928377568721771,"ecosystem":0.16919609904289246,"simulation":0.1479293704032898,"comparative":0.3421769440174103,"interactive":0.27583298087120056,"collected":0.21325601637363434,"program":0.05510478466749191,"type":0.03760179877281189,"improved":0.10908067971467972,"##ifier":0.12060028314590454,"problem":0.21354269981384277,"collections":0.09795517474412918,"massachusetts":0.45638012886047363,"games":0.8594752550125122,"gamer":0.19051086902618408,"action":0.06470873206853867,"id":0.3132678270339966,"text":0.06598370522260666,"proof":0.04040389880537987,"##nse":0.08105820417404175,"val":0.01527381781488657,"method":0.07769404351711273,"##lice":0.1268341988325119,"testing":0.1405354142189026,"lesson":0.22172845900058746,"understand":0.16448350250720978,"educating":0.18005996942520142,"classroom":0.532699704170227,"handle":0.01546946819871664,"intelligence":0.03877349570393562,"seoul":0.030209532007575035,"afford":0.37486833333969116,"schools":0.37638598680496216,"anal":0.2316465675830841,"analyze":0.3828655779361725,"shadows":0.530354917049408,"math":0.1372343748807907,"je":0.1298801302909851,"classrooms":0
.03858708217740059,"valuable":0.03767019510269165,"become":0.08132227510213852,"authors":0.061796609312295914,"participation":0.057052500545978546,"study":0.30709829926490784,"linguistics":0.006930631585419178,"jo":0.029806027188897133,"methods":0.14378832280635834,"ping":0.039579395204782486,"martinez":0.33740949630737305,"##iente":0.21659237146377563,"teaching":0.588069498538971,"1086":0.12468632310628891,"sequences":0.4480733871459961,"yoon":0.2866777777671814,"educator":0.12606795132160187,"file":0.08606069535017014,"rights":0.17952580749988556,"writing":0.15379150211811066,"electronic":0.2117549180984497,"gaming":0.627409815788269,"##ifiers":0.10449839383363724,"explore":0.0036265270318835974,"homework":0.13286109268665314,"implementing":0.06343081593513489,"##mine":0.2529478371143341,"curriculum":0.23654107749462128,"intellectual":0.004632654134184122,"transformation":0.008434533141553402,"##games":0.35754117369651794,"gathering":0.11766980588436127,"help":0.13427484035491943,"site":0.013112440705299377,"ebook":0.004344046115875244,"assess":0.25329238176345825,"##ent":0.05052437633275986,"learners":0.34589844942092896,"culture":0.11348586529493332,"instruction":0.09252434968948364,"yong":0.040066447108983994,"cite":0.27889519929885864,"statistics":0.21910452842712402,"date":0.1387467086315155,"##ifying":0.012424829415977001,"##gami":0.09016755223274231,"data":0.6263949871063232,"##game":0.209828183054924,"environments":0.20021001994609833,"use":0.4176364839076996,"subject":0.15579204261302948,"dice":0.007726054172962904,"main":0.0211870726197958,"used":0.3526446521282196,"##ball":0.006172154098749161,"space":0.09478219598531723,"##emy":0.07577776908874512,"growing":0.17136751115322113,"academic":0.3801301419734955,"publication":0.3587958514690399,"##ip":0.20192472636699677,"implemented":0.1672244518995285,"publishers":0.25085991621017456,"assessing":0.12981194257736206,"international":0.1794189214706421,"offset":0.31560638546943665,"resource":0.331453084945678
7,"kind":0.3642336130142212,"author":0.17650648951530457,"##pace":0.4614490866661072,"format":0.2339111566543579,"mining":0.6628022193908691,"published":0.3178688883781433,"literacy":0.17701704800128937,"important":0.03583519533276558,"sequence":0.6889362931251526,"license":0.08273540437221527,"effects":0.05309068784117699,"professor":0.006909577641636133,"##pro":0.22111502289772034,"eds":0.004061833955347538,"improve":0.263774573802948,"techniques":0.24114985764026642,"effect":0.188566654920578,"publisher":0.3763745129108429,"collect":0.15495893359184265,"harvard":0.036764759570360184,"errors":0.2900559604167938,"problems":0.2617033123970032,"game":0.915076732635498,"patent":0.07109424471855164,"student":0.4404866099357605,"##duction":0.2969920337200165,"purpose":0.21852804720401764,"mathematics":0.07209866493940353,"university":0.2602508068084717,"##ducted":0.04738771542906761,"manuel":0.17960745096206665,"interact":0.1939513236284256,"why":0.18151643872261047,"technique":0.10399332642555237,"media":0.3123375177383423,"error":0.28253480792045593,"textbooks":0.005854554940015078,"interactions":0.2444179207086563,"integrated":0.20436137914657593,"aggregate":0.03278617933392525,"451":0.06189008429646492,"effective":0.12966758012771606,"##ference":0.002658629324287176,"database":0.05165565386414528,"teacher":0.6446557641029358,"pedro":0.03662606328725815,"##yse":0.01469529140740633,"##8":0.053271543234586716,"studies":0.24162931740283966,"playground":0.018837811425328255,"department":0.049927953630685806,"value":0.5369448661804199,"tufts":0.033345699310302734,"process":0.36068451404571533,"assessments":0.3583606779575348,"advantage":0.09778598695993423,"implementation":0.15603342652320862,"eighth":0.21325883269309998,"rpg":0.19151069223880768,"resources":0.2295980453491211,"korean":0.04287691414356232,"application":0.036054130643606186,"activities":0.12323014438152313,"ecosystems":0.18487904965877533,"interaction":0.39692777395248413,"uses":0.13755731284618378,"##cult
ural":0.019624974578619003,"timothy":0.06808241456747055,"methodology":0.1357400119304657,"infringement":0.026672257110476494,"teaser":0.017070351168513298},"dates":[{"kind":"Publication date","value":"2020-10-21"}],"source":"DSpace@MIT","title":"Exploring the Affordances of Sequence Mining in Educational Games","source_link":"https://dspace.mit.edu/handle/1721.1/158189","content_type":["Article"],"rights":[{"description":"Article is made available in accordance with the publisher's policy and may be subject to US copyright law. Please refer to the publisher's site for terms of use.","kind":"useAndReproduction"}],"publishers":[{"name":"ACM|Eighth International Conference on Technological Ecosystems for Enhancing Multiculturality"}],"links":[{"url":"https://hdl.handle.net/1721.1/158189","kind":"Digital object URL","text":"Digital object URL"}],"contributors":[{"value":"Gomez, Manuel J.","kind":"author"},{"value":"Ruip?rez-Valiente, Jos? A.","kind":"author"},{"value":"Martinez, Pedro A.","kind":"author"},{"value":"Kim, Yoon Jeon","kind":"author"},{"value":"Massachusetts Institute of Technology. Program in Comparative Media Studies/Writing","kind":"department"}],"timdex_record_id":"dspace:1721.1-158189"},"sort":[9.902208,1603238400000]},{"_index":"dspace-2026-02-09t19-23-02","_id":"dspace:1721.1-158299","_score":9.895651,"_source":{"summary":["Background/Objective: Subarachnoid hemorrhage (SAH) is associated with high morbidity and mortality rates, necessitating prognostic algorithms to guide decisions. Our study evaluates the use of machine learning (ML) models for predicting 1-month and 1-year mortality among SAH patients using national electronic health records (EHR) system. Methods: Retrospective cohort of 29,274 SAH patients, identified through national EHR system from January 2017 to December 2022, was analyzed, with mortality data obtained from central civil registration system in Türkiye. 
Variables included (n = 102) pre- (n = 65) and post-admission (n = 37) data, such as patient demographics, clinical presentation, comorbidities, laboratory results, and complications. We employed logistic regression (LR), decision trees (DTs), random forests (RFs), and artificial neural networks (ANN). Model performance was evaluated using area under the curve (AUC), average precision, and accuracy. Feature significance analysis was conducted using LR. Results: The average age was 56.23 ± 16.45 years (47.8% female). The overall mortality rate was 22.8% at 1 month and 33.3% at 1 year. One-month mortality increased from 20.9% to 24.57% (p < 0.001), and 1-year mortality rose from 30.85% to 35.55% (p < 0.001) in the post-COVID period compared to the pre-COVID period. For 1-month mortality prediction, the ANN, LR, RF, and DT models achieved AUCs of 0.946, 0.942, 0.931, and 0.916, with accuracies of 0.905, 0.901, 0.893, and 0.885, respectively. For 1-year mortality, the AUCs were 0.941, 0.927, 0.926, and 0.907, with accuracies of 0.884, 0.875, 0.861, and 0.851, respectively. Key predictors of mortality included age, cardiopulmonary arrest, abnormal laboratory results (such as abnormal glucose and lactate levels) at presentation, and pre-existing comorbidities. Incorporating post-admission features (n = 37) alongside pre-admission features (n = 65) improved model performance for both 1-month and 1-year mortality predictions, with average AUC improvements of 0.093 ± 0.011 and 0.089 ± 0.012, respectively. Conclusions: Our study demonstrates the effectiveness of ML models in predicting mortality in SAH patients using big data. LR models’ robustness, interpretability, and feature significance analysis validate its importance. Including post-admission data significantly improved all models’ performances. 
Our results demonstrate the utility of big data analytics in population-level health outcomes studies."],"timdex_provenance":{"source":"dspace","run_date":"2026-03-01","run_id":"3b5fabfb-9ee6-7cac-94a6-3b70ba14679d_7abd3cf1-9ede-4d69-259a-9fc8edfb66a5","run_record_offset":756},"citation":"Khaniyev, T.; Cekic, E.; Gecici, N.N.; Can, S.; Ata, N.; Ulgu, M.M.; Birinci, S.; Isikay, A.I.; Bakir, A.; Arat, A.; et al. Predicting Mortality in Subarachnoid Hemorrhage Patients Using Big Data and Machine Learning: A Nationwide Study in Türkiye. J. Clin. Med. 2025, 14, 1144.","file_formats":["application/pdf"],"identifiers":[{"value":"https://hdl.handle.net/1721.1/158299","kind":"uri"},{"value":"PUBLISHER_CC","kind":"mitlicense"}],"format":"electronic resource","embedding_full_record":{"projections":0.16632112860679626,"##b":0.05230620875954628,"##arm":0.0035105280112475157,"##c":0.24454280734062195,"year":0.019565172493457794,"##mit":0.012334163300693035,"##h":0.47803592681884766,"##mir":0.12620405852794647,"accuracy":0.395274817943573,"##i":0.15243813395500183,"##ara":0.2842504382133484,"evaluation":0.10798971354961395,"analyzing":0.0022341147996485233,"score":0.051702748984098434,"##r":0.35307031869888306,"##t":0.12134937196969986,"outcomes":0.2695155143737793,"##u":0.049391984939575195,"##ancy":0.3127010762691498,"record":0.08388973772525787,"##x":0.22159112989902496,"electronically":0.16011138260364532,"##y":0.06583753228187561,"iqbal":0.061531808227300644,"evaluated":0.14186866581439972,"calculate":0.09864078462123871,"diagnostic":0.013269064016640186,"##mia":0.01303375605493784,"deaths":0.24058254063129425,"aa":0.015494641847908497,"ah":0.34629765152931213,"ai":0.2954539358615875,"ak":0.024219989776611328,"artery":0.03326644003391266,"analysis":0.2983715236186981,"accurately":0.03774131461977959,"population":0.1571645885705948,"1":0.21674297749996185,"au":0.6549807786941528,"institute":0.16446995735168457,"evaluating":0.052893009036779404,"##hort":0.07676730304956436,"ba"
:0.43012535572052,"cardiac":0.2401297688484192,"object":0.0370510071516037,"@":0.005651675630360842,"average":0.49194079637527466,"statistical":0.2494998425245285,"forest":0.15683437883853912,"achieve":0.005904712248593569,"bi":0.35660746693611145,"cited":0.13297542929649353,"proven":0.20939628779888153,"journal":0.34791651368141174,"citations":0.28663575649261475,"systems":0.0032214955426752567,"civil":0.25621160864830017,"national":0.1505037546157837,"hana":0.39562490582466125,"ce":0.45312726497650146,"abd":0.40607330203056335,"glucose":0.1750715672969818,"learn":0.14140279591083527,"e":0.06494157016277313,"h":0.23227490484714508,"cl":0.1858881115913391,"j":0.038515374064445496,"medicine":0.009021414443850517,"l":0.6030293107032776,"co":0.07803215086460114,"blood":0.43084508180618286,"forests":0.08824295550584793,"predictions":0.36986762285232544,"##ance":0.30435219407081604,"under":0.13703273236751556,"analytic":0.14022651314735413,"publications":0.10213525593280792,"acc":0.13940377533435822,"##ar":0.06386695057153702,"##met":0.3865136206150055,"##iology":0.014255529269576073,"##ay":0.24503476917743683,"##kam":0.03701021894812584,"##eva":0.03103378415107727,"##rom":0.01791592314839363,"ds":0.513344407081604,"analytics":0.42551371455192566,"dt":0.26410892605781555,"post":0.36331528425216675,"##oid":0.07297186553478241,"##ah":0.10370393097400665,"tim":0.5072606801986694,"##aj":0.1095159724354744,"female":0.11214327812194824,"predicted":0.35759443044662476,"computational":0.11025125533342361,"area":0.15256625413894653,"eh":0.43072018027305603,"ek":0.0909225195646286,"em":0.0642942264676094,"modeled":0.016392823308706284,"er":0.03697817027568817,"article":0.12290456146001816,"et":0.12192264944314957,"month":0.36643633246421814,"##bf":0.1749231070280075,"useful":0.10308419913053513,"##cs":0.007548184599727392,"neural":0.3058636486530304,"sources":0.04739272594451904,"analytical":0.0028651917818933725,"importance":0.012655545957386494,"ems":0.01535289641469717,"rashid"
:0.013404427096247673,"fatal":0.008976215496659279,"random":0.29281410574913025,"rate":0.41003739833831787,"##ch":0.22765636444091797,"##ci":0.17997576296329498,"authorship":0.06749184429645538,"sin":0.42452678084373474,"projection":0.034897610545158386,"ge":0.324842631816864,"##rial":0.04814263805747032,"effectiveness":0.4123634994029999,"digital":0.2868342399597168,"somali":0.04801568761467934,"citation":0.32789114117622375,"females":0.16772814095020294,"perform":0.06668628007173538,"retrospective":0.4028434753417969,"improvement":0.05438167229294777,"stroke":0.19376979768276215,"kahn":0.20055118203163147,"significance":0.358489066362381,"##de":0.4390100836753845,"existing":0.01791161671280861,"pdf":0.28170275688171387,"2017":0.11970996856689453,"management":0.1425808072090149,"regression":0.40131354331970215,"publish":0.21018725633621216,"interpret":0.15938878059387207,"ha":0.16127489507198334,"achieved":0.1011437326669693,"analyst":0.06333158165216446,"##ura":0.06889738887548447,"contributors":0.004226372577250004,"hd":0.05384458974003792,"age":0.5621817111968994,"big":0.6402850151062012,"##ev":0.2954094707965851,"bleeding":0.5886930227279663,"##man":0.21447183191776276,"simulation":0.04906997084617615,"rib":0.07759197056293488,"##fc":0.0781746357679367,"##fe":0.2560829222202301,"improved":0.23197069764137268,"##ifier":0.10883207619190216,"##em":0.20133526623249054,"model":0.5794802904129028,"ic":0.05545654147863388,"id":0.20659244060516357,"algorithm":0.3113534450531006,"nas":0.005899539217352867,"period":0.12936601042747498,"ik":0.0576590932905674,"il":0.33032044768333435,"large":0.18706761300563812,"##aging":0.04541703686118126,"handle":0.012739480473101139,"##ache":0.05308551341295242,"##gb":0.005723275244235992,"unpublished":0.0038874230813235044,"journals":0.05092422664165497,"intelligence":0.005245747976005077,"system":0.13227279484272003,"interval":0.03856896609067917,"singh":0.07438074797391891,"evaluate":0.19004231691360474,"authors":0.1836526244878769
,"women":0.14856216311454773,"algorithms":0.331506609916687,"curve":0.3124798834323883,"##opus":0.09652981162071228,"ain":0.027160748839378357,"##rin":0.29127711057662964,"##ha":0.03973250836133957,"##och":0.018960464745759964,"valid":0.06278664618730545,"prevalence":0.14683181047439575,"file":0.06428848206996918,"##gl":0.11080123484134674,"electronic":0.352308988571167,"##ability":0.11401300877332687,"predicting":0.5925135016441345,"outcome":0.24933679401874542,"##gu":0.20703540742397308,"##age":0.25658461451530457,"cnn":0.013659878633916378,"robust":0.2831318974494934,"##bid":0.12823280692100525,"sloan":0.5183160305023193,"health":0.218348428606987,"##id":0.23893149197101593,"##hi":0.14989672601222992,"machine":0.6243991255760193,"cite":0.18816444277763367,"##hs":0.08702109009027481,"##iy":0.15335381031036377,"##sis":0.009736447595059872,"use":0.1527697592973709,"precision":0.3238876163959503,"##tens":0.013351826928555965,"lac":0.2656191289424896,"##il":0.27462899684906006,"automation":0.035713497549295425,"##im":0.21472427248954773,"ma":0.16568388044834137,"##io":0.0605204775929451,"publication":0.38499826192855835,"##ip":0.24206888675689697,"nes":0.35393983125686646,"calculated":0.038421448320150375,"ml":0.6648946404457092,"##ix":0.0331592857837677,"##cic":0.19616267085075378,"##roid":0.03305206075310707,"level":0.020541323348879814,"##ka":0.20842552185058594,"author":0.19496269524097443,"##ema":0.015305300243198872,"conducted":0.08601797372102737,"diagnosis":0.08082875609397888,"admission":0.28034618496894836,"heart":0.1058012843132019,"##ity":0.10505462437868118,"clinical":0.34713074564933777,"na":0.2210163027048111,"202":0.060532864183187485,"arrests":0.09212909638881683,"improve":0.13236480951309204,"background":0.058756276965141296,"prediction":0.45296284556388855,"monthly":0.18773320317268372,"ni":0.21139340102672577,"##che":0.005862046964466572,"ahmed":0.16721901297569275,"code":0.18453297019004822,"university":0.07047976553440094,"med":0.0384819693863391
9,"##li":0.021427826955914497,"##mission":0.13669639825820923,"##dis":0.04681935906410217,"effective":0.3574286997318268,"investigator":0.017481621354818344,"predict":0.5668691992759705,"department":0.07154864817857742,"ann":0.43681082129478455,"determine":0.040841344743967056,"rates":0.23365284502506256,"deviation":0.06832551956176758,"##ml":0.1505689024925232,"manuscript":0.09222015738487244,"##gno":0.2909998297691345,"##emia":0.171987846493721,"nhs":0.12031684815883636,"machines":0.1952805519104004,"authored":0.0821838527917862,"accurate":0.32582446932792664,"mustafa":0.4041937589645386,"objective":0.1871785670518875,"estimate":0.183462455868721,"publishing":0.3290919363498688,"models":0.5160419344902039,"##cies":0.06955371797084808,"using":0.1767246425151825,"forecast":0.36517229676246643,"##itis":0.0453786626458168,"##no":0.1579941362142563,"abnormal":0.082566037774086,"rf":0.35728657245635986,"##ipe":0.009560646489262581,"sub":0.571846067905426,"##rak":0.002446502447128296,"##tek":0.0066922251135110855,"##rah":0.2297580987215042,"##stic":0.17873741686344147,"##des":0.12568220496177673,"networks":0.1056860163807869,"sa":0.7866416573524475,"##vid":0.2161475270986557,"goddard":0.03454362228512764,"ara":0.3142560124397278,"##or":0.20078785717487335,"##ation":0.03858928382396698,"mir":0.05212758108973503,"mit":0.5941270589828491,"u2":0.0416477806866169,"email":0.0068123964592814445,"##ages":0.20229534804821014,"su":0.2763376832008362,"variables":0.26158690452575684,"stat":0.12981314957141876,"complications":0.2975848913192749,"decision":0.22195309400558472,"ottoman":0.04600246623158455,"one":0.04612800478935242,"cardiovascular":0.16287386417388916,"asa":0.09020794183015823,"simulations":0.09682819247245789,"##00":0.1797279417514801,"##01":0.30066755414009094,"automated":0.2766290605068207,"##pu":0.1280541718006134,"metric":0.015509288758039474,"associated":0.27799972891807556,"mortality":0.6959043741226196,"khan":0.30453670024871826,"calculation":0.107974573969841,
"##rb":0.03615947812795639,"medical":0.2755252718925476,"##rh":0.3517885208129883,"##rk":0.10346924513578415,"run":0.23476608097553253,"source":0.2159099131822586,"research":0.3148193061351776,"##can":0.24560831487178802,"ata":0.4030856788158417,"ich":0.07540832459926605,"presentation":0.20356157422065735,"features":0.07803194969892502,"hai":0.024025363847613335,"##14":7.299255230464041E-4,"158":0.30670568346977234,"school":0.04307673126459122,"ul":0.3921319544315338,"results":0.22956570982933044,"ur":0.20782405138015747,"estimates":0.1630251109600067,"pre":0.221347838640213,"significant":0.3565692603588104,"pro":0.19088375568389893,"bleed":0.5407309532165527,"modelling":0.11252636462450027,"improving":0.004977360833436251,"mls":0.2530680298805237,"##28":0.04566890373826027,"##29":0.10980857908725739,"##ede":0.03419176861643791,"overall":0.1050630584359169,"citing":0.019071675837039948,"##sa":0.07783172279596329,"aus":0.0036318765487521887,"##tan":0.07317749410867691,"records":0.30689412355422974,"recording":0.009464900940656662,"learning":0.4035013020038605,"##hir":0.27140116691589355,"##ogist":0.0053257509134709835,"##hin":0.28470250964164734,"central":0.16844001412391663,"##cans":0.05323408916592598,"##bara":0.00634216982871294,"1717":0.0338951013982296,"summary":0.10823003947734833,"##ika":0.3981630206108093,"registry":0.07023851573467255,"disease":0.015091711655259132,"estimated":0.16058389842510223,"##ur":0.15649960935115814,"artificial":0.41761937737464905,"1721":0.3706821799278259,"curves":0.052967317402362823,"##46":0.006801373325288296,"watson":0.013531357049942017,"medicare":0.09560615569353104,"stem":0.05624548718333244,"modeling":0.31109747290611267,"##ova":0.07349615544080734,"aziz":0.005394640378654003,"multi":0.10017853230237961,"hem":0.694517970085144,"mor":0.20593836903572083,"identified":0.09866124391555786,"##plication":0.12475156784057617,"massachusetts":0.003105104435235262,"##nse":0.045524321496486664,"como":0.11996207386255264,"efficiency":0.
029026998206973076,"method":0.016597453504800797,"nationally":0.1904960572719574,"##lice":0.09225025027990341,"conclusions":0.08770733326673508,"admissions":0.09253038465976715,"vascular":0.05590091645717621,"nationwide":0.5212215781211853,"registration":0.0963604524731636,"card":0.28911858797073364,"study":0.38272571563720703,"log":0.4024736285209656,"methods":0.12340947240591049,"##hes":0.07627758383750916,"variability":0.01014069002121687,"commons":0.13547077775001526,"feature":0.22026239335536957,"##raine":0.014788000844419003,"##mans":0.0011243533808737993,"##ifiers":0.062157101929187775,"hepatitis":0.03699856996536255,"performed":0.08980035781860352,"##mann":0.027369815856218338,"##ors":0.1712764948606491,"##yev":0.058063339442014694,"incidence":0.11099553108215332,"statistics":0.28292563557624817,"date":0.13626226782798767,"data":0.6337661147117615,"arrest":0.2982217073440552,"##kit":0.09680308401584625,"##kir":0.2984657883644104,"used":0.09726621210575104,"space":0.12431018799543381,"##nor":0.05248469114303589,"percentage":0.2345493882894516,"publishers":0.025517236441373825,"##kic":0.3642825186252594,"tag":0.22373168170452118,"##fusion":0.04936373606324196,"offset":0.32926884293556213,"resource":0.16307388246059418,"##ids":0.10927924513816833,"kind":0.06410723179578781,"patients":0.3759303689002991,"survival":0.19112639129161835,"##pace":0.5045238733291626,"ill":0.132027730345726,"format":0.09169566631317139,"tree":0.06653709709644318,"published":0.33131593465805054,"##idi":0.08418503403663635,"estimation":0.01811029762029648,"cochrane":0.01463786419481039,"##pro":0.09827270358800888,"turkish":0.05832987651228905,"publisher":0.23240706324577332,"autopsy":0.10372350364923477,"abdul":0.018674656748771667,"death":0.5411603450775146,"##duction":0.3224498927593231,"values":0.1407640129327774,"scale":0.009744948707520962,"##han":0.018819915130734444,"##lio":0.27815723419189453,"network":0.11002799868583679,"##0":0.02338423579931259,"projected":0.03369615972042084
,"database":0.175077885389328,"pneumonia":0.015555204823613167,"patient":0.42011523246765137,"studies":0.2248029261827469,"##9":0.08403560519218445,"hospital":0.10944396257400513,"value":0.5598036646842957,"pmid":0.04975513368844986,"efficacy":0.1757708638906479,"performance":0.34094658493995667,"##istic":0.16973215341567993,"variable":0.15459512174129486,"clinic":0.012469998560845852,"##ona":0.11275823414325714,"timothy":0.09422598034143448,"demographics":0.14041739702224731},"dates":[{"kind":"Publication date","value":"2025-02-10"}],"source":"DSpace@MIT","title":"Predicting Mortality in Subarachnoid Hemorrhage Patients Using Big Data and Machine Learning: A Nationwide Study in Türkiye","related_items":[{"description":"Journal of Clinical Medicine","relationship":"host"}],"source_link":"https://dspace.mit.edu/handle/1721.1/158299","content_type":["Article"],"rights":[{"description":"Creative Commons Attribution","kind":"useAndReproduction"}],"publishers":[{"name":"Multidisciplinary Digital Publishing Institute"}],"links":[{"url":"https://hdl.handle.net/1721.1/158299","kind":"Digital object URL","text":"Digital object URL"}],"contributors":[{"value":"Khaniyev, Taghi","kind":"author"},{"value":"Cekic, Efecan","kind":"author"},{"value":"Gecici, Neslihan Nisa","kind":"author"},{"value":"Can, Sinem","kind":"author"},{"value":"Ata, Naim","kind":"author"},{"value":"Ulgu, Mustafa Mahir","kind":"author"},{"value":"Birinci, Suayip","kind":"author"},{"value":"Isikay, Ahmet Ilkay","kind":"author"},{"value":"Bakir, Abdurrahman","kind":"author"},{"value":"Arat, Anil","kind":"author"},{"value":"Hanalioglu, Sahin","kind":"author"},{"value":"Sloan School of Management","kind":"department"}],"timdex_record_id":"dspace:1721.1-158299"},"sort":[9.895651,1739145600000]},{"_index":"dspace-2026-02-09t19-23-02","_id":"dspace:1721.1-152921","_score":9.891104,"_source":{"summary":["Digital Health Systems could play a pivotal role in improving heathcare if a critical mass of reliable data 
were obtained (remote health) and subjected to dynamic pattern analyses to reveal (expose?) underlying key physiological performance indicators. The latter could help medical professionals (at point of care) or remote healthcare (home) practitioners with predictive and prescriptive analytics to aid in making better data-informed decisions or feed/update decision support systems."],"timdex_provenance":{"source":"dspace","run_date":"2026-04-10","run_id":"1e989aeb-a718-2082-6d5c-ab65094616e7_39c4774c-cf18-aaa7-2606-ea3eaa1b94a8","run_record_offset":14},"languages":["en"],"citation":"Datta, Shoumen (2023-11-07): Healthcare, Clinical Research and Digital Health Systems. Presentation. https://dspace.mit.edu/handle/1721.1/152921","file_formats":["application/pdf"],"identifiers":[{"value":"https://hdl.handle.net/1721.1/152921","kind":"uri"}],"format":"electronic resource","embedding_full_record":{"authored":0.021231507882475853,"##script":0.347543329000473,"inform":0.21078716218471527,"##d":0.031994469463825226,"credible":0.06367392838001251,"objects":0.09067576378583908,"##i":0.07800138741731644,"remote":0.6263675689697266,"##l":0.11216314882040024,"dynamics":0.06913971155881882,"identification":0.2810859680175781,"contribution":0.0038984566926956177,"record":0.44620025157928467,"##x":0.365296334028244,"electronically":0.06588010489940643,"##ances":0.06315882503986359,"publishing":0.1899750679731369,"##cript":0.0950607880949974,"#":0.023600516840815544,"ai":0.07695913314819336,"indicators":0.35727792978286743,"analysis":0.273896187543869,"rd":0.03933202475309372,"domain":0.12960416078567505,"institute":0.33909276127815247,"object":0.279073029756546,"@":0.05482913926243782,"boston":0.037370506674051285,"statistical":0.11289884895086288,"role":0.3218716084957123,"document":0.08156663179397583,"cited":0.3284362554550171,"proven":0.37651151418685913,"##des":0.25199952721595764,"citations":0.381166011095047,"journal":0.1535976678133011,"systems":0.4937988221645355,"mit":0.59133
66079330444,"##ded":0.18693938851356506,"key":0.13178260624408722,"email":0.10048474371433258,"_":0.09303927421569824,"cc":0.17693433165550232,"website":0.09146188944578171,"address":0.02669881470501423,"cf":0.01119350828230381,"d":0.23059701919555664,"decision":0.2111225575208664,"languages":0.12798775732517242,"dept":0.11548557877540588,"biomedical":0.1552218645811081,"##01":0.08990740031003952,"indices":0.1720534861087799,"automated":0.09897561371326447,"metric":0.18460829555988312,"ibm":0.023297712206840515,"information":0.20864345133304596,"##ance":0.3364950120449066,"##umen":0.4091958999633789,"analytic":0.21626640856266022,"##lth":0.11926168948411942,"publications":0.113625667989254,"medical":0.531481921672821,"##re":0.07620159536600113,"dh":0.01787944696843624,"project":0.06109234690666199,"##and":0.01892884634435177,"run":0.37288862466812134,"language":0.13804306089878082,"source":0.29686880111694336,"research":0.6393256783485413,"152":0.3527137041091919,"ds":0.678463876247406,"##21":0.28636670112609863,"analytics":0.44228553771972656,"presentation":0.36358001828193665,"##med":0.06819050759077072,"##19":0.011191751807928085,"tim":0.5981734991073608,"dynamic":0.42181938886642456,"cambridge":0.1421809047460556,"ea":0.08359898626804352,"ur":0.3618442714214325,"digit":0.5384813547134399,"tech":0.011527047492563725,"pre":0.13726957142353058,"eh":0.13065269589424133,"##care":0.2965044677257538,"patterns":0.3570670187473297,"##22":0.1043500006198883,"technologies":0.06107059121131897,"improving":0.20370076596736908,"exposing":0.18883471190929413,"labs":0.07689259201288223,"laboratory":0.2759990394115448,"spaces":0.10769324004650116,"citing":0.22183780372142792,"sho":0.41185659170150757,"support":0.05910578742623329,"useful":0.04586322233080864,"virtual":0.2263684719800949,"formats":0.2103085070848465,"analytical":0.13478077948093414,"sources":0.09934329241514206,"records":0.4017236530780792,"mass":0.2740211486816406,"roles":0.09182348847389221,"update":0.140844315
29045105,"recording":0.11265017837285995,"title":0.12198717147111893,"172":0.047377776354551315,"##da":0.24166902899742126,"content":0.12285836786031723,"sourced":0.060372401028871536,"authorship":0.08446160703897476,"wellness":0.05383550748229027,"exposed":0.21673136949539185,"1718":4.009520635008812E-4,"##ta":0.36045384407043457,"digital":0.8953678607940674,"summary":0.13594719767570496,"registry":0.11244787275791168,"citation":0.4472592771053314,"technology":0.12647239863872528,"improvement":0.11178860813379288,"##51":0.0057396311312913895,"expose":0.34333717823028564,"home":0.06941477209329605,"##de":0.6347955465316772,"1722":0.04972529411315918,"1721":0.4354505240917206,"##46":0.12539514899253845,"pdf":0.2961193919181824,"##47":0.137250155210495,"referenced":0.016100231558084488,"infrastructure":0.01703060045838356,"publish":0.12169615179300308,"analyst":0.04762504994869232,"contributors":0.10967490077018738,"hd":0.12872764468193054,"physiological":0.2916363775730133,"medicare":0.26308920979499817,"practice":0.12892262637615204,"copyright":0.07650091499090195,"software":0.06992138922214508,"prefix":0.015080694109201431,"repository":0.08813498169183731,"tracking":0.1289379894733429,"improved":0.19488772749900818,"reliable":0.31316444277763367,"number":0.2531754672527313,"##ifier":0.13102199137210846,"massachusetts":0.5568485856056213,"##space":0.013618218712508678,"id":0.5719196796417236,"text":0.020465273410081863,"researchers":0.10590264201164246,"practitioner":0.09934240579605103,"index":0.12522438168525696,"handle":0.14286155998706818,"underlying":0.1462550163269043,"script":0.02959490939974785,"system":0.5517770648002625,"practitioners":0.22612595558166504,"issn":0.12583279609680176,"remotely":0.5158811807632446,"care":0.3793204128742218,"##opus":0.0276015792042017,"reliability":0.138273224234581,"pattern":0.354310005903244,"presentations":0.19809800386428833,"healthcare":0.6341591477394104,"file":0.21794889867305756,"bibliography":0.08343440294265747,"web"
:0.1171182245016098,"identity":0.19561034440994263,"rights":0.13054361939430237,"electronic":0.43816816806793213,"decisions":0.05112862214446068,"predicting":0.06075272709131241,"informed":0.256807804107666,"##ifiers":0.023352447897195816,"could":0.18057088553905487,"health":0.8315020203590393,"##id":0.015384525991976261,"help":0.0017953157657757401,"pivotal":0.3245539665222168,"cite":0.38022324442863464,"php":0.09588387608528137,"statistics":0.08501850813627243,"date":0.3444145917892456,"indicator":0.27064114809036255,"hospitals":0.25408586859703064,"codes":0.07792925834655762,"auto":0.5051999688148499,"reveal":0.12267738580703735,"data":0.5980324745178223,"##ive":0.20161914825439453,"use":0.06182742863893509,"##kit":0.01902262680232525,"nursing":0.003813118441030383,"lab":0.14069032669067383,"space":0.30397555232048035,"heath":0.35725051164627075,"reference":0.10468719899654388,"cloud":0.013644259423017502,"ma":0.1161927580833435,"##rner":8.823337848298252E-4,"dat":0.5755953788757324,"presented":0.0029659748543053865,"publication":0.37110626697540283,"links":0.11013282090425491,"tag":0.05531400442123413,"potential":0.08391561359167099,"##ix":0.027615690603852272,"offset":0.4230552911758423,"presenter":0.12793801724910736,"resource":0.3279263973236084,"kind":0.19884997606277466,"##pace":0.6371805667877197,"format":0.31088778376579285,"published":0.2846498489379883,"feed":0.06938833743333817,"clinical":0.6913189888000488,"##pro":0.2786668837070465,"202":0.22570493817329407,"improve":0.20908509194850922,"topic":0.0436699241399765,"files":0.02925705350935459,"harvard":0.06709406524896622,"code":0.3107832968235016,"critical":0.43122178316116333,"##duction":0.32044172286987305,"university":0.22702941298484802,"link":0.15726949274539948,"med":0.0865049660205841,"point":0.08619894832372665,"digitally":0.499701589345932,"database":0.2945125102996826,"contributor":0.04594521224498749,"patient":0.2433016151189804,"predict":0.27433881163597107,"##9":0.14443688094615936,"studi
es":0.027390746399760246,"hospital":0.343527615070343,"department":0.13150078058242798,"value":0.38764986395835876,"universal":0.24875178933143616,"tufts":0.10025160759687424,"##ass":0.03720395267009735,"initiative":0.03136167675256729,"disclosed":0.00625734543427825,"##atics":0.05680132657289505,"verified":0.006840330548584461,"resources":0.21792930364608765,"automatic":0.11520040035247803,"pmid":0.03865690529346466,"cyber":0.36444011330604553,"performance":0.3283030688762665,"application":0.12314873933792114,"##ls":0.0071022119373083115,"nhs":0.25356635451316833,"online":0.24914361536502838,"clinic":0.314358651638031,"##set":0.01912974752485752,"timothy":0.26817241311073303},"dates":[{"kind":"Publication date","value":"2023-11-07"}],"source":"DSpace@MIT","title":"Healthcare, Clinical Research and Digital Health Systems","source_link":"https://dspace.mit.edu/handle/1721.1/152921","content_type":["Presentation"],"rights":[{"description":"CC0 1.0 Universal","kind":"useAndReproduction"}],"links":[{"url":"https://hdl.handle.net/1721.1/152921","kind":"Digital object URL","text":"Digital object URL"}],"contributors":[{"value":"Datta, Shoumen","kind":"author"},{"value":"Massachusetts Institute of Technology. Auto-ID Laboratory","kind":"department"}],"timdex_record_id":"dspace:1721.1-152921"},"sort":[9.891104,1699315200000]},{"_index":"dspace-2026-02-09t19-23-02","_id":"dspace:1721.1-165055","_score":9.855363,"_source":{"summary":["Mounting concerns about safety and security have resulted in an intricate ecosystem system of\r\nguidelines, compliance measures, directives and policy reports for cybersecurity of all critical\r\ninfrastructure. 
The policy paradox is that the text form of policy documents is an impediment to\r\nthe implementation of policies and directives and creates potentially powerful opportunity costs.\r\nAs a general practice, guidelines, directives and policy documents are presented in text form,\r\npage-by-page and word-by-word all supported by figures, diagrams and tables as needed. By\r\ndefinition text obscures properties of both policy and system-target in terms of dynamic\r\nrelationships, feedback, “drill-down”, leads and lags, and so forth.\r\nThe challenge is to develop analytics for cybersecurity policy of cyber physical systems. We begin\r\nwith constructing (a) a structured system model of the system, in order to (b) identify major policydefined\r\nsystem-wide parameters, (c) situate system vulnerabilities, (d) map security requirements\r\nto security objectives, and (e) advance research on how system properties respond to diverse\r\npolicy controls for security of cyber physical systems.\r\nThis Project addresses the hard problem of policy-governed secure collaboration related to cyberphysical\r\nsecurity of critical infrastructure (focusing on a generic and fundamental feature, namely\r\nsmart grid of electric power systems). The purpose is to (a) reduce, if not eliminate barriers to full\r\nunderstanding of policy text as transmitted by the source, (b) explore system-wide or targeted\r\nimplications, (c) help contextualize generic directives for specific applications, and (d) facilitate\r\ncontingency analysis, as needed.\r\nThis Compilation is based on the Quarterly Research Reports submitted by MIT to the Cyber-\r\nPhysical Systems Organization of Vanderbilt University. The Compilation is the first of several\r\nReports highlighting the research process and products of the MIT Project on Policy Analytics for\r\nCybersecurity of Cyber-Physical Systems. Gaurav Agarwal [a.k.a. 
Gaurav], MIT alumnus, served\r\nas Lead Researcher for the Proof-of-Concept case presented here."],"timdex_provenance":{"source":"dspace","run_date":"2026-03-07","run_id":"cd0cdc78-ab33-1470-e6b7-b98a322f4971_61b5107d-953d-12a3-ee92-ef93984cdab5","run_record_offset":22},"languages":["en_US"],"citation":"Choucri, N. and Anaya, J. (2024). Policy analytics for Cybersecurity of cyber-Physical Systems. MIT Department of Political Science","file_formats":["application/pdf"],"identifiers":[{"value":"https://hdl.handle.net/1721.1/165055","kind":"uri"}],"subjects":[{"value":["Proof-of-concept, text-as-data, design structure matrix, metrics, network models, Cybersecurity Framework, C-I-A, security, privacy, security objectives and requirements, impact levels"],"kind":"Subject scheme not provided"}],"format":"electronic resource","embedding_full_record":{"projects":0.17903973162174225,"govern":0.018122175708413124,"##mit":0.08438833802938461,"objects":0.08451484888792038,"seismic":0.030874039977788925,"##i":0.05641346424818039,"##l":0.061056122183799744,"analyzing":0.07814662158489227,"##t":0.03525763005018234,"##v":0.2339586317539215,"record":0.1429898887872696,"##x":0.22493621706962585,"iqbal":0.012734001502394676,"##ances":0.08041682094335556,"##z":0.05900108069181442,"ab":0.07887619733810425,"ag":0.263523131608963,"documentation":0.3029804825782776,"impact":0.19157634675502777,"opportunity":0.18227754533290863,"analysis":0.5226325392723083,"submitted":0.2506049871444702,"science":0.1871064156293869,"domain":0.14785459637641907,"institute":0.32314467430114746,"object":0.26875248551368713,"boston":0.03059421479701996,"@":0.013631853275001049,"statistical":0.08711983263492584,"prove":0.12351904809474945,"scheme":0.240999236702919,"cited":0.2810979187488556,"##pile":0.1585104912519455,"proven":0.3622814416885376,"matrix":0.3385859429836273,"citations":0.35828909277915955,"journal":0.10655322670936584,"systems":0.3771725296974182,"targeted":0.23412516713142395,"vanderbilt":0.56
58547282218933,"departments":0.1947503387928009,"policy":0.8520675897598267,"_":0.07612555474042892,"cd":0.14742007851600647,"c":0.08780612796545029,"d":0.02286004275083542,"subjects":0.059461385011672974,"j":0.02532157301902771,"mounted":0.0833672508597374,"practices":0.08066949993371964,"r":0.34662505984306335,"intrusion":0.016262361779808998,"##ance":0.3344329297542572,"exploit":0.038894981145858765,"analytic":0.3960074782371521,"publications":0.059259071946144104,"reports":0.3632704019546509,"##ar":0.11940012872219086,"controls":0.17160175740718842,"##tsu":0.02991398796439171,"##and":0.019574791193008423,"language":0.1779775172472,"##ding":0.18959103524684906,"developed":0.12754090130329132,"ds":0.5242580771446228,"analytics":0.6176697015762329,"##ab":0.10068318992853165,"assessment":0.016281498596072197,"attacks":0.08539120107889175,"tim":0.44339221715927124,"implement":0.021503502503037453,"cho":0.5346516370773315,"##anal":0.0888482928276062,"##tri":0.12460793554782867,"##cu":0.18850575387477875,"identifying":0.0022079532500356436,"formats":0.19537000358104706,"##net":0.06958407163619995,"analytical":0.27937787771224976,"sources":0.1531428098678589,"crypt":0.11198952794075012,"cis":0.18133676052093506,"title":0.1433403491973877,"papers":0.06193003058433533,"content":0.30185437202453613,"##cd":0.28527316451072693,"compiled":0.2318304479122162,"tennessee":0.02341093309223652,"sourced":0.08158615976572037,"authorship":0.03514477610588074,"ga":0.25253719091415405,"reporting":0.22276648879051208,"digital":0.27146098017692566,"##du":0.002851901575922966,"identify":0.11558803170919418,"citation":0.4283715784549713,"concerns":0.18997511267662048,"##ec":0.1115662157535553,"##de":0.4143005311489105,"pdf":0.33730456233024597,"nodes":0.006989726796746254,"form":0.302905797958374,"publish":0.06834015250205994,"analyst":0.3869735896587372,"##ura":0.23260508477687836,"contributors":0.1864524930715561,"hd":0.16763094067573547,"practice":0.1948229968547821,"copyright":0.078332
84139633179,"##era":0.1062735989689827,"collaborator":0.14853228628635406,"intricate":0.1460569202899933,"responding":0.029307736083865166,"##ifier":0.06788437068462372,"tables":0.05058242753148079,"context":0.22609686851501465,"property":0.16256430745124817,"##em":0.11760064959526062,"guidelines":0.31521114706993103,"model":0.39949798583984375,"text":0.4464409053325653,"id":0.35159969329833984,"##ep":0.11131341755390167,"https":0.025540979579091072,"reduce":0.04427680745720863,"nas":0.22131620347499847,"mapping":0.1525663584470749,"researchers":0.11384031921625137,"ip":0.05171667039394379,"electrical":0.264787882566452,"handle":0.24539673328399658,"schemes":0.1399010717868805,"intelligence":0.03314319998025894,"system":0.49354445934295654,"anal":0.270503968000412,"analyze":0.14035308361053467,"server":0.11226587742567062,"##physical":0.30009061098098755,"##urity":0.12459668517112732,"##rin":0.18722954392433167,"protection":0.11313717812299728,"##fra":0.23517286777496338,"quarterly":0.14316408336162567,"targets":0.15809062123298645,"file":0.25255683064460754,"bibliography":0.09186592698097229,"rights":0.12509982287883759,"electronic":0.22390565276145935,"mal":0.03457567095756531,"map":0.2011367380619049,"##hy":0.06530708074569702,"##age":0.013439471833407879,"topics":0.0999549999833107,"##analysis":0.12277538329362869,"systematic":0.05755247920751572,"hacker":0.32389238476753235,"framework":0.3136243522167206,"la":0.10306905210018158,"report":0.42877981066703796,"cite":0.35172006487846375,"php":0.046984244138002396,"hacked":0.061409130692481995,"governance":0.1762625128030777,"subject":0.24087105691432953,"political":0.36710554361343384,"mca":0.0505998432636261,"networking":0.0091158552095294,"exploitation":0.05425475537776947,"hacking":0.22397306561470032,"##sic":0.10074746608734131,"pages":0.04802699759602547,"ma":0.05411692336201668,"publication":0.31628739833831787,"documented":0.005147858057171106,"implemented":0.10383337736129761,"links":0.12401335686445236,"#
#ix":0.046110719442367554,"constructing":0.1082177609205246,"author":0.040841441601514816,"na":0.12604887783527374,"202":0.20660099387168884,"nc":0.07265374809503555,"mounting":0.31699439883232117,"perimeter":0.10116458684206009,"compilations":0.26170504093170166,"ng":0.05371144786477089,"##elin":0.17689335346221924,"ni":0.017582817003130913,"harvard":0.08460245281457901,"problems":0.14991149306297302,"np":0.08788318932056427,"code":0.2071293592453003,"##ith":0.10085029900074005,"##yst":0.26273253560066223,"##ela":0.11582739651203156,"ns":0.19996856153011322,"university":0.30527663230895996,"nt":0.14840827882289886,"##ducted":0.035884957760572433,"policies":0.5923827886581421,"##li":0.16949284076690674,"##olic":0.13071684539318085,"harden":0.16458658874034882,"##ber":0.07357387244701385,"ana":0.3074275255203247,"design":0.12455844134092331,"##ack":0.00878168735653162,"paradox":0.6016201972961426,"physical":0.45872950553894043,"department":0.4000469446182251,"initiative":0.06063641607761383,"penetration":0.0576443150639534,"control":0.08890759944915771,"structure":0.18037229776382446,"##iance":0.14755676686763763,"cyber":0.6374145150184631,"##ln":0.07560259848833084,"application":0.14124566316604614,"compilation":0.4955906271934509,"csi":0.05744526535272598,"compliant":0.025938913226127625,"objectives":0.1522798240184784,"threat":0.05993501469492912,"##set":0.024431079626083374,"respond":0.022337891161441803,"incident":0.056522052735090256,"properties":0.2939905524253845,"forms":0.0037021837197244167,"authored":0.03063337318599224,"handles":0.02248317003250122,"compiling":0.24590809643268585,"objective":0.200186088681221,"concern":0.1967221200466156,"password":0.264615535736084,"dynamics":0.0453212708234787,"identification":0.13503406941890717,"contribution":0.09382698684930801,"prep":0.40689149498939514,"publishing":0.14344874024391174,"proposal":0.004776024725288153,"models":0.22475025057792664,"based":0.07052995264530182,"##cture":0.0872935876250267,"vulnerability
":0.45755675435066223,"monitoring":0.05328779295086861,"node":0.2267923206090927,"theorem":0.00619195681065321,"concepts":0.22414720058441162,"##nt":0.07252366840839386,"##ructured":6.955789285711944E-4,"21":0.0051214140839874744,"document":0.5289787650108337,"fundamental":0.1825188398361206,"##des":0.15762585401535034,"networks":0.06440650671720505,"proving":0.032411184161901474,"encryption":0.13157810270786285,"##fin":0.13449625670909882,"audit":0.15937377512454987,"reported":0.01583744026720524,"mit":0.778570830821991,"structured":0.33781883120536804,"u2":0.034225184470415115,"##ded":0.017857519909739494,"email":0.07050343602895737,"languages":0.1192782074213028,"##hema":0.05131974071264267,"structures":0.07738504558801651,"dept":0.28264862298965454,"diagram":0.27493607997894287,"##00":0.014506361447274685,"##01":0.3081023693084717,"147":0.13701850175857544,"metric":0.3173581063747406,"ibm":0.024963708594441414,"collaboration":0.3085474669933319,"supported":0.005804123822599649,"##rity":0.2678479850292206,"alumnus":0.02330329641699791,"documents":0.4921739101409912,"##ingen":0.12114101648330688,"##ri":0.2544974386692047,"project":0.5458959937095642,"developing":0.13685011863708496,"organisation":0.009189709089696407,"run":0.23801201581954956,"source":0.32231128215789795,"secure":0.5386306047439575,"challenging":0.16544105112552643,"research":0.5599268078804016,"##21":0.06737709790468216,"presentation":0.07708734273910522,"blackout":0.009030415676534176,"dynamic":0.2986593544483185,"cambridge":0.10623205453157425,"ict":0.022171294316649437,"ur":0.29710257053375244,"##ime":0.013258508406579494,"55":0.1628722846508026,"tech":0.0537070631980896,"##se":0.11212868988513947,"maps":0.03484436869621277,"solutions":0.010584844276309013,"##tion":0.047448962926864624,"develop":0.12856420874595642,"modelling":0.02182154916226864,"##32":0.0497855618596077,"technologies":0.012542681768536568,"##25":0.05427270382642746,"##ru":0.048562631011009216,"obscure":0.07207997888326645,"#
#tions":0.1675819307565689,"citing":0.15885643661022186,"page":0.08994056284427643,"parameters":0.22132478654384613,"secured":0.19222433865070343,"internet":0.19909049570560455,"##tan":0.29293641448020935,"vu":0.26317691802978516,"analysts":0.19299761950969696,"policing":0.08817403018474579,"submit":0.10121256113052368,"records":0.010997336357831955,"concept":0.40900957584381104,"mass":0.2011508196592331,"privacy":0.321444034576416,"##his":0.13001766800880432,"##fen":0.07341352105140686,"##hip":0.04068906232714653,"##34":0.02406107634305954,"malicious":0.018308447673916817,"##st":0.015411808155477047,"documenting":0.22693325579166412,"##38":0.07036411762237549,"linux":0.04322934150695801,"1717":0.019869016483426094,"1716":0.015610488131642342,"summary":0.21365565061569214,"cases":0.0734008178114891,"wide":0.33955132961273193,"mart":0.04635502025485039,"technology":0.13829657435417175,"##51":0.19135285913944244,"##wide":0.03722134232521057,"##52":0.020379116758704185,"generic":0.3929252624511719,"directive":0.4282437562942505,"target":0.2867112159729004,"##mart":0.2468019425868988,"##45":0.07545102387666702,"1722":0.04916056990623474,"1721":0.39085274934768677,"##46":0.04888632893562317,"##hips":0.08772233873605728,"##47":0.05903966352343559,"##49":0.2309960275888443,"guidance":0.042794156819581985,"infrastructure":0.3737844228744507,"##uc":0.33742934465408325,"##ual":0.17414222657680511,"applications":0.05902928113937378,"modeling":0.20035268366336823,"##ware":0.057544462382793427,"ecosystem":0.2312299907207489,"software":8.973765070550144E-4,"transmitted":0.09608662128448486,"repository":0.03322092443704605,"##vs":0.031550224870443344,"##55":0.33007049560546875,"feedback":0.1677292436361313,"measures":0.1682422161102295,"problem":0.25087007880210876,"identified":0.12118552625179291,"safety":0.39948657155036926,"massachusetts":0.5472524166107178,"proof":0.4844881594181061,"case":0.18385222554206848,"guide":0.177982896566391,"##lica":0.17224997282028198,"researcher":
0.1623527705669403,"collaborative":0.11327135562896729,"##tech":0.08680078387260437,"##ders":0.222658172249794,"nsa":0.010352975688874722,"##jit":0.05815210938453674,"geo":0.00438648508861661,"computer":0.08821798861026764,"web":0.03197501227259636,"power":0.2304418832063675,"##ecure":0.08674904704093933,"architecture":0.05421127378940582,"situ":0.2945811152458191,"##bution":0.1109088584780693,"##ifiers":0.03207244724035263,"electricity":0.2102687656879425,"lead":0.19565151631832123,"##ort":0.2484651356935501,"conceptual":0.13217273354530334,"grid":0.3877498209476471,"organization":0.21469703316688538,"##ya":0.1720818728208542,"##virus":0.08016129583120346,"submission":0.13398736715316772,"##wal":0.19115020334720612,"governed":0.2913575768470764,"statistics":0.22469434142112732,"date":0.1432856023311615,"data":0.40346866846084595,"nun":0.2093040943145752,"##rill":0.24129819869995117,"forensic":0.017843974754214287,"space":0.15341146290302277,"reference":0.04151657596230507,"barrier":0.10215180367231369,"1653":0.06855060160160065,"major":0.004964148625731468,"1652":0.058509305119514465,"presented":0.07224864512681961,"1650":0.20894649624824524,"das":0.009738964028656483,"development":0.14115428924560547,"offset":0.39883607625961304,"resource":0.29856550693511963,"kind":0.053787052631378174,"##pace":0.4774037301540375,"format":0.32893818616867065,"published":0.25586220622062683,"##ition":0.08642226457595825,"##pro":0.14712272584438324,"eds":0.021851012483239174,"fraud":0.07790643721818924,"safe":0.10442058742046356,"topic":0.09450533241033554,"files":0.09398303180932999,"##att":0.04226376861333847,"politics":0.03602929785847664,"critical":0.36727145314216614,"challenges":0.34066450595855713,"purpose":0.2950150668621063,"##duction":0.2909848690032959,"link":0.12449145317077637,"diagrams":0.257127970457077,"##fine":0.08855520188808441,"imp":0.21164283156394958,"network":0.2485916018486023,"##0":0.05774230137467384,"general":0.041412629187107086,"security":0.692716658115
387,"database":0.1371305137872696,"targeting":0.09379316121339798,"contributor":0.09491313993930817,"##4":0.06515686959028244,"paper":0.057491518557071686,"parameter":0.024371862411499023,"matrices":0.08933504670858383,"value":0.4566603899002075,"##ass":0.1344771683216095,"breach":0.12246336042881012,"process":0.09203315526247025,"requirements":0.07355997711420059,"implementation":0.3002133369445801,"electric":0.24092997610569,"resources":0.20721140503883362,"##ont":0.09332072734832764,"##bers":0.2133735567331314,"governing":0.10440192371606827,"barriers":0.18030862510204315,"##wall":0.03366374224424362,"compliance":0.3132564425468445,"response":0.06641685217618942,"challenge":0.41575950384140015,"reduction":0.00979398563504219,"timothy":0.1248047724366188,"methodology":0.162016361951828},"dates":[{"kind":"Publication date","value":"2024-10-08"}],"source":"DSpace@MIT","title":"Policy Analytics for Cybersecurity of Cyber-Physical Systems","source_link":"https://dspace.mit.edu/handle/1721.1/165055","content_type":["Preprint"],"rights":[{"description":"Attribution-NoDerivs 3.0 United States","kind":"useAndReproduction"}],"links":[{"url":"https://hdl.handle.net/1721.1/165055","kind":"Digital object URL","text":"Digital object URL"}],"contributors":[{"value":"Choucri, Nazli","kind":"author"},{"value":"Massachusetts Institute of Technology. Department of Political Science","kind":"department"}],"timdex_record_id":"dspace:1721.1-165055"},"sort":[9.855363,1728345600000]},{"_index":"dspace-2026-02-09t19-23-02","_id":"dspace:1721.1-155172","_score":9.834821,"_source":{"summary":["The proliferation of environmentally oriented programs within the tech industry, and the industry's coinciding efforts toward data and technology democratization, generate concerns about the status of environmental data within digital economy. 
While the accumulation of digital personal data has been a cornerstone of domination of the data analytics industry, many believe environmental data to be a source of “untapped potential.” The potential of environmental data, the argument goes, would benefit equally the digital economy, environmental sciences, and academic data and artificial intelligence experts. This article analyzes the proliferation of the rhetoric about open environmental data by focusing on Microsoft's Planetary Computer cloud computing program and computer vision experts who curate and use biodiversity data stored on Microsoft's servers. Through an analytical framework of sociotechnical imaginaries, the article draws connections between visions of future for environmental knowledge production and governance promoted by Microsoft and the work of computer vision experts intending to benefit from the potential of environmental data as machine learning training sets while at the same time helping environmental sciences. Although environmental data on the Planetary Computer is democratized, it nonetheless becomes a valued asset to data economy, but often with unintended consequences, such as enabling citizen science biodiversity data to be used by state surveillance apparatus. The article challenges the view that data's democratization is unproblematically serving environmental sciences by examining the consequences of imaginaries of democratization emerging from the data industry leaders and processes of nonmonetary valuation of environmental data by experts who curate these datasets."],"timdex_provenance":{"source":"dspace","run_date":"2026-03-01","run_id":"3b5fabfb-9ee6-7cac-94a6-3b70ba14679d_7abd3cf1-9ede-4d69-259a-9fc8edfb66a5","run_record_offset":129},"languages":["en_US"],"citation":"Lukacz, P. M. (2024). Imaginaries of democratization  and the value of open environmental data: Analysis of Microsoft’s planetary computer. 
Big Data & Society, 11(2).","file_formats":["application/pdf"],"identifiers":[{"value":"2053-9517","kind":"issn"},{"value":"https://hdl.handle.net/1721.1/155172","kind":"uri"}],"format":"electronic resource","embedding_full_record":{"pr":0.20855014026165009,"inform":0.006584869232028723,"objects":0.0952901765704155,"pollution":0.21596167981624603,"expertise":0.09704595804214478,"dem":0.026941683143377304,"##nk":0.013570986688137054,"concern":0.10540108382701874,"analyzing":0.12095053493976593,"contribution":0.0039902799762785435,"record":0.08264709264039993,"##x":0.2482665479183197,"##ances":0.012936326675117016,"##my":0.11560401320457458,"publishing":0.243905171751976,"societies":0.11448270082473755,"knowledge":0.41912439465522766,"using":0.0028756035026162863,"environmental":0.957639217376709,"ai":0.28598180413246155,"##ized":0.21824651956558228,"personal":0.19067128002643585,"google":0.08191899210214615,"economy":0.28479844331741333,"analysis":0.33120813965797424,"benefit":0.33388885855674744,"node":0.1950647234916687,"valuation":0.24706465005874634,"science":0.25890228152275085,"domain":0.02835041470825672,"programs":0.011283018626272678,"object":0.23657944798469543,"@":0.05723048374056816,"statistical":0.01854875311255455,"argued":0.03703547269105911,"sustainable":0.013720753602683544,"cited":0.2505488395690918,"industry":0.3928072154521942,"global":0.13350871205329895,"proven":0.26645469665527344,"believe":0.07690484076738358,"##des":0.15060952305793762,"civic":0.015995748341083527,"worth":0.02236994355916977,"serving":0.014567587524652481,"promote":0.022433938458561897,"diversity":0.242380291223526,"democrat":0.5717180967330933,"citations":0.2730453908443451,"journal":0.0769108459353447,"mit":0.4985615015029907,"visions":0.08609767258167267,"wikipedia":0.016025561839342117,"cornerstone":0.20166823267936707,"u2":0.22029878199100494,"##ities":0.03850628063082695,"computers":0.3433530628681183,"emerging":0.1850433498620987,"enabling":0.036789391189813614,"langua
ges":0.1495412290096283,"d":0.060073040425777435,"democrats":0.21686115860939026,"socio":0.08874396234750748,"benefited":0.041695449501276016,"xbox":0.041524488478899,"democracy":0.4539027214050293,"##00":0.05321521311998367,"##01":0.3740650713443756,"ibm":0.15542301535606384,"planetary":0.638927698135376,"information":0.325020968914032,"emerge":0.10204385966062546,"##ance":0.2830584645271301,"technological":0.1598358154296875,"##izations":0.14858722686767578,"experts":0.09184237569570541,"analytic":0.0883086696267128,"open":0.6614389419555664,"citizens":0.19599810242652893,"publications":0.2582312226295471,"liberal":0.11890272796154022,"##mer":0.12632960081100464,"##ri":0.011592765338718891,"project":0.09525147080421448,"language":0.15608692169189453,"run":0.09951156377792358,"source":0.3236405849456787,"##ding":0.08205891400575638,"microsoft":0.710879385471344,"##ally":2.7626569499261677E-4,"research":0.08529271185398102,"ds":0.569587230682373,"analytics":0.3123241066932678,"sciences":0.16859503090381622,"155":0.3503921627998352,"view":0.08779000490903854,"##mut":0.011759702116250992,"##16":0.03616945445537567,"##17":0.27766042947769165,"##mony":0.0248235072940588,"tim":0.5070005655288696,"cambridge":0.03132150322198868,"ict":0.07287528365850449,"ur":0.17498467862606049,"info":0.04450036212801933,"computational":0.043382592499256134,"tech":0.14689908921718597,"##rating":0.11759848147630692,"planet":0.3328576683998108,"##sl":0.1493796706199646,"##ended":0.1663937121629715,"article":0.30032697319984436,"technologies":0.25931909680366516,"vision":0.2515312731266022,"curator":0.13109876215457916,"##bf":0.15792308747768402,"##tri":0.0035444851964712143,"beneficial":0.1050763949751854,"spaces":0.08350890874862671,"citing":0.16582801938056946,"useful":0.09313325583934784,"coin":0.2907187044620514,"benefits":0.2138475626707077,"formats":0.13221195340156555,"analytical":0.2474525272846222,"sources":0.14357775449752808,"production":0.03215177357196808,"##cz":0.2782974243164
0625,"privacy":0.021798601374030113,"learning":0.2211502641439438,"training":0.11607679724693298,"##eta":0.037810150533914566,"title":0.03161260113120079,"##kow":0.01378566399216652,"content":0.19195415079593658,"ozone":0.010623850859701633,"skyla":0.17530587315559387,"society":0.3901752531528473,"ecology":0.03270626813173294,"sourced":0.1462593972682953,"authorship":0.07456739246845245,"##sz":0.05737731605768204,"democratic":0.502338707447052,"surveillance":0.20182174444198608,"peat":0.03597504273056984,"##com":0.05268209055066109,"digital":0.6037920713424683,"summary":0.07575780898332596,"green":0.32520803809165955,"citation":0.3529687523841858,"argue":0.049683213233947754,"technology":0.3460521996021271,"windows":0.2551928162574768,"concerns":0.1585519015789032,"futures":0.10004878044128418,"storing":0.041441917419433594,"##de":0.4748181104660034,"##bly":0.046797800809144974,"1722":0.029014142230153084,"environment":0.7956183552742004,"1721":0.3685874342918396,"artificial":0.3183639645576477,"pdf":0.22068379819393158,"##isation":0.17115512490272522,"publish":0.08781294524669647,"analyst":0.043791089206933975,"contributors":0.1204037293791771,"hd":0.060936059802770615,"articles":0.08599361032247543,"big":0.37004637718200684,"expert":0.1679455041885376,"copyright":0.10740923136472702,"software":0.18215125799179077,"ecosystem":0.08987870812416077,"##ble":0.27103614807128906,"##nta":0.14941078424453735,"bio":0.15961143374443054,"##ize":0.16971832513809204,"program":0.1681315153837204,"##vs":0.03358672559261322,"##iza":0.04757000133395195,"##ifier":0.010954968631267548,"epa":0.5769003629684448,"##space":0.010924916714429855,"id":0.22486631572246552,"azure":0.1811218559741974,"ecological":0.27757954597473145,"##nation":0.019332433119416237,"im":0.47657909989356995,"##pped":0.24647140502929688,"matt":0.08000479638576508,"handle":0.07815210521221161,"##tech":0.2159467339515686,"intel":0.03612895309925079,"creative":0.039456017315387726,"intelligence":0.26062655448913574,
"conservation":0.01377936452627182,"issn":0.2424430400133133,"anal":0.03807324171066284,"analyze":0.1157510057091713,"opens":0.11807260662317276,"valuable":0.2537994086742401,"status":0.17439444363117218,"##nar":0.32159626483917236,"server":0.15800750255584717,"semantic":0.0016424168134108186,"##opus":0.01285668183118105,"solar":0.24477523565292358,"##ization":0.40502890944480896,"commons":0.3271509110927582,"geo":0.12985648214817047,"computer":0.5118081569671631,"##mon":0.21662278473377228,"file":0.17180803418159485,"planets":0.23326101899147034,"rights":0.13033504784107208,"electronic":0.17173391580581665,"accumulate":0.09361431002616882,"##agi":0.35256895422935486,"##bution":0.06309644877910614,"consequence":0.013779634609818459,"implications":0.04063049703836441,"proliferation":0.3871406316757202,"techno":0.017130030319094658,"##analysis":0.05054590851068497,"climate":0.06139377877116203,"abstract":0.023782839998602867,"nasa":0.03904031217098236,"framework":0.19425147771835327,"future":0.30818989872932434,"machine":0.2613254487514496,"curated":0.24225641787052155,"stored":0.24411877989768982,"industries":0.09941481798887253,"cite":0.285324364900589,"##ration":0.11601662635803223,"##matic":0.0707002654671669,"asset":0.2848440706729889,"economic":0.21023547649383545,"governance":0.23570480942726135,"date":0.035882700234651566,"argument":0.28698107600212097,"data":0.981550395488739,"environments":0.2072492092847824,"##izing":0.0956932082772255,"use":0.10117553174495697,"wwf":0.06441573798656464,"moderator":0.030283158645033836,"lu":0.44154173135757446,"##ies":0.2680078148841858,"used":0.13400408625602722,"space":0.26818472146987915,"cloud":0.45598459243774414,"eco":0.27238041162490845,"assets":0.06993768364191055,"academia":0.028459440916776657,"academic":0.08835941553115845,"publication":0.3112300932407379,"host":0.17358654737472534,"sage":0.5202959179878235,"consequences":0.14910221099853516,"publishers":0.10021016001701355,"links":0.08477737754583359,"##ze":0.04
202134907245636,"rhetoric":0.250410795211792,"potential":0.4929376244544983,"##ties":0.09754648804664612,"##ium":0.008295216597616673,"citizen":0.3338492214679718,"offset":0.301104336977005,"resource":0.29429903626441956,"accumulation":0.28188490867614746,"##ka":0.27347350120544434,"kind":0.07043073326349258,"ms":0.002063110237941146,"##pace":0.5303755402565002,"format":0.1764538288116455,"1550":0.02067301608622074,"opened":0.2505062520503998,"published":0.2525362968444824,"sustainability":0.01741463877260685,"economies":0.12907840311527252,"##ity":0.09944295138120651,"license":0.09471320360898972,"efforts":0.1338716447353363,"##pro":0.27203118801116943,"202":0.1634114533662796,"scientists":0.017774706706404686,"205":0.1648096889257431,"publisher":0.20560890436172485,"files":0.02893361635506153,"topic":0.0026730140671133995,"environmentally":0.6511920690536499,"oriented":0.1892649531364441,"##duction":0.29113849997520447,"challenges":0.2162867784500122,"university":0.09471544623374939,"values":0.2523362636566162,"curate":0.1736440509557724,"##zed":0.05174295976758003,"link":0.09375612437725067,"clouds":0.3342892527580261,"storage":0.047244805842638016,"##0":0.01518387533724308,"database":0.3982866108417511,"computing":0.36677467823028564,"servers":0.09421923756599426,"contributor":0.06431445479393005,"##9":0.04605719447135925,"value":0.6248470544815063,"wildlife":0.12589514255523682,"biodiversity":0.5118732452392578,"##zation":9.008422493934631E-4,"social":0.03584308177232742,"resources":0.20526662468910217,"##zcz":0.062237855046987534,"cyber":0.09915608167648315,"economics":0.09353553503751755,"application":0.03685908019542694,"valued":0.22964398562908173,"earth":0.055132776498794556,"challenge":0.15652737021446228,"uses":0.066822849214077,"##set":0.2164408266544342,"timothy":0.13613562285900116,"##ification":0.03912912309169769},"dates":[{"kind":"Publication date","value":"2024-04-03"}],"source":"DSpace@MIT","title":"Imaginaries of democratization and the value 
of open environmental data: Analysis of Microsoft's planetary computer","related_items":[{"description":"Big Data & Society","relationship":"host"}],"source_link":"https://dspace.mit.edu/handle/1721.1/155172","content_type":["Article"],"rights":[{"description":"Creative Commons Attribution-NonCommercial-NoDerivs License","kind":"useAndReproduction"}],"publishers":[{"name":"SAGE Publications"}],"links":[{"url":"https://hdl.handle.net/1721.1/155172","kind":"Digital object URL","text":"Digital object URL"}],"contributors":[{"value":"Lukacz, Przemyslaw Matt","kind":"author"}],"timdex_record_id":"dspace:1721.1-155172"},"sort":[9.834821,1712102400000]},{"_index":"dspace-2026-02-09t19-23-02","_id":"dspace:1721.1-156704","_score":9.805464,"_source":{"summary":["In this chapter we discuss recent trends in the application of urban big data and their impact on real estate markets. We expect such technologies to improve quality of life and the productivity of cities over the long run.\r\n\r\nWe forecast that smart city technologies will reinforce the primacy of the most successful global metropolises at least for a decade or more. A few select metropolises in emerging countries may also leverage these technologies to leapfrog on the provision of local public services. In the long run, all cities throughout the urban system will end up adopting successful and cost-effective smart city initiatives. Nevertheless, smaller scale interventions are likely to crop up everywhere, even in the short run. Such targeted programs are more likely to improve conditions in blighted or relatively deprived neighborhoods, which could generate gentrification and higher valuations there.\r\n\r\nIt is unclear whether urban information systems will have a centralizing or suburbanizing impact. 
They are likely to make denser urban centers more attractive, but they are also bound to make suburban or exurban locations more accessible."],"timdex_provenance":{"source":"dspace","run_date":"2026-03-01","run_id":"3b5fabfb-9ee6-7cac-94a6-3b70ba14679d_7abd3cf1-9ede-4d69-259a-9fc8edfb66a5","run_record_offset":60},"languages":["en"],"citation":"Barkham, R., Bokhari, S., Saiz, A. (2022). Urban Big Data: City Management and Real Estate Markets. In: Pardalos, P.M., Rassia, S.T., Tsokas, A. (eds) Artificial Intelligence, Machine Learning, and Optimization Tools for Smart Cities. Springer Optimization and Its Applications, vol 186. Springer, Cham.","file_formats":["application/pdf"],"identifiers":[{"value":"https://hdl.handle.net/1721.1/156704","kind":"uri"}],"format":"electronic resource","embedding_full_record":{"projections":0.1401839703321457,"inform":0.08534654229879379,"objects":0.03950889781117439,"##i":0.059320710599422455,"barking":0.21691149473190308,"geography":0.09725580364465714,"record":0.14138011634349823,"##x":0.22025249898433685,"initiatives":0.323788583278656,"##z":0.09848258644342422,"publishing":0.33241528272628784,"recent":0.2539703845977783,"chicago":0.10729643702507019,"##city":0.48995548486709595,"springer":0.46936991810798645,"trends":0.39358001947402954,"successfully":0.2669741213321686,"neighborhoods":0.1828674077987671,"prima":0.29669564962387085,"ras":0.3055306673049927,"metropolis":0.2419874519109726,"mayor":0.17439159750938416,"impact":0.5216153860092163,"expected":0.28854793310165405,"ai":0.43886223435401917,"##og":0.10441479086875916,"forecast":0.3528292179107666,"leaps":0.15168383717536926,"analysis":0.00846954993903637,"benefit":0.1987144947052002,"quality":0.2405805140733719,"planning":0.2023746371269226,"valuation":0.20860765874385834,"adopt":0.16405142843723297,"##bation":0.003334695938974619,"municipal":0.286393404006958,"adopting":0.21410155296325684,"institute":0.2989825904369354,"programs":0.07054341584444046,"object":0.1501020193
0999756,"boston":0.2622091770172119,"chapter":0.1611601859331131,"mega":0.056975606828927994,"accessible":0.04296526685357094,"statistical":0.008599650114774704,"##polis":0.09969201683998108,"housing":0.06385874003171921,"cited":0.1673237532377243,"global":0.2652430534362793,"proven":0.29034799337387085,"##des":0.072894386947155,"bo":0.31585660576820374,"##ban":0.32425618171691895,"citations":0.22568538784980774,"adoption":0.20513787865638733,"##market":0.1834978312253952,"journal":0.010370162315666676,"urbana":0.05330430343747139,"##os":0.03435099869966507,"systems":0.2945594787597656,"managed":0.056782178580760956,"does":0.030543256551027298,"targeted":0.22123079001903534,"mit":0.5612893104553223,"##oka":0.33758944272994995,"departments":0.02278643101453781,"emerging":0.3196992874145508,"densely":0.19427794218063354,"b":0.18672741949558258,"density":0.23139028251171112,"languages":0.10524851083755493,"manager":0.07119967043399811,"d":0.04994354397058487,"dept":0.09173927456140518,"services":0.02477504126727581,"marketing":0.18472819030284882,"automated":0.12061234563589096,"r":0.00902861449867487,"interventions":0.25775349140167236,"advantages":0.13035660982131958,"ibm":0.11407007277011871,"information":0.5379797220230103,"emerge":0.027239402756094933,"##ance":0.2643630802631378,"technological":0.07185225188732147,"adopted":0.1335841715335846,"ts":0.2726966142654419,"publications":0.042062755674123764,"##mer":0.10041651874780655,"##oit":0.01003533136099577,"developing":0.025915149599313736,"project":0.012210002169013023,"run":0.25178050994873047,"language":0.07734430581331253,"source":0.2282906174659729,"research":0.01145964302122593,"ds":0.5986661314964294,"analytics":0.32444050908088684,"3d":0.026516642421483994,"156":0.29739516973495483,"bark":0.5216007232666016,"tim":0.4510343074798584,"cambridge":0.16789324581623077,"##imi":0.20152366161346436,"ict":0.0638674795627594,"ur":0.11311544477939606,"cha":0.04817728325724602,"generate":0.045821674168109894,"computat
ional":0.010864618234336376,"par":0.2650246322154999,"richard":0.1673041582107544,"tech":0.021603159606456757,"attractive":0.21049143373966217,"metropolitan":0.21672242879867554,"solutions":0.12042980641126633,"bloomberg":0.11653478443622589,"article":0.1557273417711258,"dense":0.2759205400943756,"technologies":0.49269813299179077,"wiley":0.02381950616836548,"improving":0.2543458640575409,"ex":0.1912124752998352,"##bf":0.13360877335071564,"##tri":0.3928034007549286,"mls":0.07897666096687317,"success":0.4249723255634308,"spaces":0.11391180753707886,"citing":0.010226800106465816,"neighborhood":0.2313847690820694,"useful":0.061846498399972916,"crop":0.0738658532500267,"internet":0.03927037492394447,"benefits":0.1886419802904129,"##ali":0.0483507439494133,"formats":0.06075581908226013,"sources":0.07724282145500183,"applied":0.19828961789608002,"##fying":0.03685636818408966,"mass":0.21689191460609436,"edition":0.0011931265471503139,"learning":0.22666555643081665,"content":0.0811300203204155,"smarter":0.2370360791683197,"##dal":0.24179880321025848,"central":0.2697153687477112,"##fied":0.12972936034202576,"successful":0.46156492829322815,"##com":0.07203519344329834,"digital":0.3585423529148102,"effectiveness":0.1965980976819992,"summary":0.12269668281078339,"citation":0.3052418828010559,"effectively":0.08205591887235641,"center":0.07450546324253082,"technology":0.4924424886703491,"improvement":0.1685573160648346,"##ur":0.23877960443496704,"##de":0.3761538863182068,"artificial":0.49412158131599426,"1721":0.33919239044189453,"pdf":0.18314826488494873,"urban":0.7134478092193604,"management":0.4212340712547302,"infrastructure":0.20691759884357452,"succeed":0.14176632463932037,"publish":0.08926717936992645,"contributors":0.04779329150915146,"hd":0.08862102776765823,"articles":0.009080346673727036,"applications":0.29019781947135925,"big":0.7156572937965393,"decade":0.04742911458015442,"modeling":0.12954527139663696,"software":0.1266930252313614,"estates":0.09666062146425247,"##o
va":0.08527058362960815,"trend":0.33972403407096863,"improves":0.08760450780391693,"##ize":0.04429179057478905,"program":0.08729840815067291,"improved":0.2911769151687622,"optimization":0.2900022864341736,"reinforce":0.1579500287771225,"zoning":0.04810115694999695,"massachusetts":0.5504817962646484,"property":0.1789003610610962,"centers":0.07247471809387207,"id":0.18642106652259827,"spatial":0.15736208856105804,"generation":0.025800101459026337,"likely":0.2766180634498596,"##fy":0.06509701162576675,"large":0.25901055335998535,"##aging":0.0688416138291359,"handle":0.07328426092863083,"impacts":0.3802437484264374,"reinforced":0.011498188599944115,"deprived":0.1622665822505951,"creative":0.0013907633256167173,"intelligence":0.4406392276287079,"system":0.27655336260795593,"issn":0.007167704403400421,"metro":0.19359762966632843,"driven":0.018753182142972946,"##fr":0.14869850873947144,"managers":0.12009971588850021,"valuable":0.021506257355213165,"suburbs":0.401684433221817,"algorithms":0.06217828765511513,"city":0.9666189551353455,"##ization":0.12237793952226639,"tools":0.39052814245224,"smart":0.7838570475578308,"local":0.24024848639965057,"commons":0.22995172441005707,"gen":0.3706226646900177,"suburban":0.4281647503376007,"electronic":0.17198635637760162,"leap":0.23539720475673676,"share":0.027647288516163826,"##fication":0.3575572371482849,"predicting":0.005938361398875713,"##bution":0.03708871081471443,"implications":0.14966000616550446,"m2":0.005237497854977846,"globalization":0.08925893902778625,"implementing":0.02824171632528305,"expect":0.17344874143600464,"future":0.2729673981666565,"machine":0.23715026676654816,"grid":0.031240105628967285,"##khar":0.3168095648288727,"cite":0.23351429402828217,"economic":0.023792972788214684,"improvements":0.04428465664386749,"date":0.06689444929361343,"data":0.858656644821167,"##izing":0.09162696450948715,"use":0.07016243040561676,"municipality":0.04137998819351196,"autonomous":0.0606221929192543,"planners":0.007665123790502548
,"space":0.2542840242385864,"centralized":0.11348838359117508,"cloud":0.0862370952963829,"automation":0.1533161699771881,"ma":0.18592239916324615,"successes":0.12025909870862961,"biggest":0.08568278700113297,"##sia":0.15526646375656128,"publication":0.3080557882785797,"implemented":0.016611585393548012,"publishers":0.11659819632768631,"international":0.1662949025630951,"potential":0.06240147724747658,"development":0.02761646918952465,"cities":0.7717313766479492,"offset":0.3959893584251404,"marketplace":0.08804726600646973,"resource":0.20648406445980072,"kind":0.07874076813459396,"##pace":0.5187349319458008,"estate":0.4756513833999634,"format":0.09180416911840439,"real":0.4427936375141144,"published":0.278761088848114,"lever":0.15583491325378418,"tool":0.30048471689224243,"market":0.46620702743530273,"markets":0.44313302636146545,"efforts":0.08854459226131439,"effects":0.03840510547161102,"##pro":0.1851738691329956,"202":0.24779343605041504,"eds":0.24575641751289368,"improve":0.346388041973114,"effect":0.15516270697116852,"publisher":0.18273036181926727,"managing":0.16755689680576324,"intervention":0.18117186427116394,"leverage":0.22383639216423035,"code":0.0189793910831213,"##duction":0.25677359104156494,"university":0.17988169193267822,"##har":0.2332463562488556,"link":0.03100156970322132,"scale":0.23524068295955658,"##ham":0.22231359779834747,"effective":0.3515866994857788,"projected":0.05516262352466583,"database":0.3035520017147064,"targeting":0.09871981292963028,"computing":0.0770440399646759,"##2":0.06058964505791664,"productivity":0.3403632640838623,"public":0.05957052484154701,"albert":0.27018100023269653,"studies":0.05297514423727989,"sai":0.37120795249938965,"department":0.1755354106426239,"value":0.4876960515975952,"##light":0.2749512493610382,"applying":0.03272309899330139,"initiative":0.269153356552124,"cost":0.019235974177718163,"will":0.32694172859191895,"advantage":0.03319155424833298,"implementation":0.14281277358531952,"resources":0.143242403864860
53,"municipalities":0.24801526963710785,"intelligent":0.18403106927871704,"economics":0.02493765391409397,"application":0.31939730048179626,"##yar":0.08306445926427841,"productive":0.1824491322040558,"suburb":0.13544636964797974,"nyc":0.03830505162477493,"timothy":0.06735052168369293},"dates":[{"kind":"Publication date","value":"2022"}],"source":"DSpace@MIT","title":"Urban Big Data: City Management and Real Estate Markets","source_link":"https://dspace.mit.edu/handle/1721.1/156704","content_type":["Article"],"rights":[{"description":"Creative Commons Attribution-Noncommercial-ShareAlike","kind":"useAndReproduction"}],"publishers":[{"name":"Springer International Publishing"}],"links":[{"url":"https://hdl.handle.net/1721.1/156704","kind":"Digital object URL","text":"Digital object URL"}],"contributors":[{"value":"Barkham, Richard","kind":"author"},{"value":"Bokhari, Sheharyar","kind":"author"},{"value":"Saiz, Albert","kind":"author"},{"value":"Massachusetts Institute of Technology. Department of Urban Studies and Planning","kind":"department"},{"value":"Massachusetts Institute of Technology. Center for Real Estate","kind":"department"}],"timdex_record_id":"dspace:1721.1-156704"},"sort":[9.805464,1640995200000]},{"_index":"dspace-2026-02-09t19-23-02","_id":"dspace:1721.1-157266","_score":9.738817,"_source":{"summary":["Artificial intelligence (AI) has become a transformative force across various disciplines, including urban planning. It has unprecedented potential to address complex challenges. An essential task is to facilitate informed decision making regarding the integration of constantly evolving AI analytics into planning research and practice. This paper presents a review of how AI methods are applied in urban studies, focusing particularly on carbon neutrality planning. We highlight how AI is already being used to generate new scientific knowledge on the interactions between human activities and nature. 
We consider the conditions in which the advantages of AI-enabled urban studies can positively influence decision-making outcomes. We also consider the importance of interdisciplinary collaboration, responsible AI governance, and community engagement in guiding data-driven methods and suggest how AI can contribute to supporting carbon-neutrality goals."],"timdex_provenance":{"source":"dspace","run_date":"2026-03-01","run_id":"3b5fabfb-9ee6-7cac-94a6-3b70ba14679d_7abd3cf1-9ede-4d69-259a-9fc8edfb66a5","run_record_offset":529},"citation":"Cong, C.; Page, J.; Kwak, Y.; Deal, B.; Kalantari, Z. AI Analytics for Carbon-Neutral City Planning: A Systematic Review of Applications. Urban Sci. 2024, 8, 104.","file_formats":["application/pdf"],"identifiers":[{"value":"https://hdl.handle.net/1721.1/157266","kind":"uri"},{"value":"PUBLISHER_CC","kind":"mitlicense"}],"format":"electronic resource","embedding_full_record":{"authored":0.07231736183166504,"inform":0.1992703229188919,"strategic":0.018503477796912193,"objects":0.07213416695594788,"##i":0.006379297468811274,"discipline":0.0670488253235817,"facilitated":0.01761423796415329,"pollution":0.012718310579657555,"building":0.02259322814643383,"analyzing":0.061783842742443085,"contribution":0.15195900201797485,"contributions":0.05753938853740692,"identification":0.02813098579645157,"outcomes":0.16598781943321228,"record":0.17070218920707703,"complex":0.003962114918977022,"##x":0.2652757465839386,"sci":0.22725984454154968,"initiatives":0.006992309354245663,"##ances":0.039989303797483444,"publishing":0.39420852065086365,"chicago":0.10723680257797241,"##city":0.10787098854780197,"knowledge":0.28485986590385437,"goals":0.24832114577293396,"models":0.02788669988512993,"using":0.03420861437916756,"mayor":0.09123044461011887,"impact":0.01691107451915741,"ai":0.7672895193099976,"neutral":0.5727460980415344,"analysis":0.43815475702285767,"community":0.2196015566587448,"interdisciplinary":0.33586418628692627,"benefit":0.07735676318407059,"p
lanning":0.6969754099845886,"plans":0.3211684226989746,"science":0.10619672387838364,"warming":0.08082469552755356,"municipal":0.26285019516944885,"institute":0.3248865306377411,"object":0.19334474205970764,"boston":0.2555510997772217,"@":0.0728084146976471,"deal":0.3565342426300049,"statistical":0.16295361518859863,"activity":0.0797741636633873,"sustainable":0.025562401860952377,"cited":0.308601975440979,"proven":0.29102203249931335,"##des":0.23267404735088348,"adaptive":0.09505265951156616,"how":0.02721831016242504,"citations":0.35686734318733215,"journal":0.17614367604255676,"urbana":0.004552333615720272,"mit":0.6096349954605103,"departments":0.10549873113632202,"##ded":0.13716959953308105,"emerging":0.020685695111751556,"email":0.016563313081860542,"cc":0.07360918074846268,"enabling":0.11875684559345245,"c":0.07167989760637283,"decision":0.39847955107688904,"d":0.1593010276556015,"j":0.022490302100777626,"dept":0.15388080477714539,"co":0.17527158558368683,"practices":0.10922011733055115,"evolve":0.07847420126199722,"automated":0.09146296977996826,"advantages":0.2834923267364502,"metric":0.05903392657637596,"collaboration":0.28015637397766113,"unprecedented":0.10764697194099426,"z":0.04012702777981758,"##ance":0.3104928433895111,"analytic":0.3653605580329895,"essential":0.19866341352462769,"publications":0.12282438576221466,"supported":0.005542430095374584,"engagement":0.27921348810195923,"##ri":0.19893847405910492,"project":0.10882294923067093,"run":0.2343788594007492,"source":0.2872168719768524,"challenging":0.037857409566640854,"research":0.48169344663619995,"ds":0.6437534689903259,"analytics":0.5414751172065735,"zero":0.2549031674861908,"157":0.3710242807865143,"tim":0.5362935662269592,"##ak":0.214310422539711,"cambridge":0.17093521356582642,"ur":0.16592583060264587,"generate":0.0805879607796669,"contributed":0.010354691185057163,"tech":0.0025046784430742264,"making":0.21524356305599213,"solutions":0.058065399527549744,"article":0.23658615350723267,"technolog
ies":0.1583688110113144,"##25":0.12543751299381256,"##26":0.2900700271129608,"##bf":0.13552822172641754,"##tri":0.013053578324615955,"spaces":0.12551502883434296,"citing":0.17453689873218536,"page":0.34651273488998413,"support":0.09594341367483139,"useful":0.08118769526481628,"benefits":0.1352979689836502,"analysts":0.09690916538238525,"formats":0.1335248500108719,"analytical":0.24809473752975464,"sources":0.1612001657485962,"applied":0.400658518075943,"records":0.02911366894841194,"importance":0.20617826282978058,"mass":0.24471774697303772,"generating":0.05835161730647087,"title":0.08217684179544449,"papers":0.0968458503484726,"##da":0.055150650441646576,"content":0.13523933291435242,"sourced":0.06473223865032196,"authorship":0.13381285965442657,"responsible":0.14330273866653442,"emissions":0.15626701712608337,"human":0.13174138963222504,"digital":0.4366913139820099,"summary":0.0712430477142334,"citation":0.4162903428077698,"apply":0.06363292783498764,"reviewing":0.14658698439598083,"jess":0.008375178091228008,"technology":0.18335238099098206,"##de":0.571442186832428,"artificial":0.6808552742004395,"1721":0.3452003598213196,"##46":0.047772929072380066,"pdf":0.2271570861339569,"berkeley":0.04312417656183243,"urban":0.6743624210357666,"disciplines":0.22263602912425995,"management":0.023320429027080536,"infrastructure":0.018403830006718636,"publish":0.2061080038547516,"analyst":0.23597978055477142,"contributors":0.13408637046813965,"articles":0.08136263489723206,"applications":0.3104793131351471,"practice":0.2022295594215393,"copyright":0.004533988889306784,"modeling":0.10988948494195938,"##ova":0.05320790037512779,"software":0.009879212826490402,"##nta":0.3545236885547638,"focus":0.02292454242706299,"cong":0.5785154700279236,"collaborate":0.06940234452486038,"approach":0.05306495353579521,"multi":0.2517147362232208,"collaborator":0.0988779291510582,"##ifier":0.06329630315303802,"carbon":0.8301328420639038,"review":0.44496166706085205,"enable":0.08860013633966446,"mas
sachusetts":0.5672842264175415,"model":0.013932784087955952,"id":0.32638731598854065,"spatial":0.10759305208921432,"plan":0.37909582257270813,"##nse":0.07483720034360886,"guide":0.003447607858106494,"algorithm":0.055464718490839005,"cooperation":0.023992789909243584,"goal":0.20324862003326416,"method":0.28553536534309387,"researchers":0.062287554144859314,"collaborative":0.13540048897266388,"##lice":0.07894132286310196,"za":0.132134348154068,"handle":0.03885762020945549,"being":0.07555237412452698,"creative":0.09640195220708847,"intelligence":0.5341018438339233,"seoul":0.07119648158550262,"anal":0.11683714389801025,"analyze":0.04281589388847351,"integration":0.27180013060569763,"driven":0.23634940385818481,"force":0.24364928901195526,"authors":0.11556889116764069,"engaged":0.112053282558918,"algorithms":0.11660069972276688,"study":0.32074373960494995,"drones":0.010631960816681385,"city":0.6895884275436401,"methods":0.34474414587020874,"##shin":0.2277328372001648,"##making":0.05304143577814102,"##ha":0.02772916667163372,"yoon":0.3045981526374817,"tools":0.09832728654146194,"commons":0.30452221632003784,"enabled":0.20327648520469666,"smart":0.08543198555707932,"file":0.05286150425672531,"bibliography":5.297535681165755E-4,"ka":0.06688455492258072,"rights":0.05896950513124466,"electronic":0.17311343550682068,"decisions":0.29970282316207886,"neutrality":0.5049085021018982,"planner":0.24539904296398163,"outcome":0.11371593922376633,"informed":0.3106823265552521,"##bution":0.1041048988699913,"##ifiers":0.04675302281975746,"systematic":0.46295803785324097,"climate":0.18128998577594757,"positive":0.04865116626024246,"kw":0.34122201800346375,"transformation":0.20877434313297272,"agenda":0.03565756231546402,"evolving":0.14791782200336456,"framework":0.007431890349835157,"yong":0.0550355426967144,"cite":0.33398374915122986,"kala":0.32930788397789,"governance":0.34398671984672546,"communities":0.08535771071910858,"statistics":0.052806124091148376,"date":0.13963960111141205,"dat
a":0.39655566215515137,"use":0.08380871266126633,"##kit":0.09065615385770798,"used":0.35450369119644165,"autonomous":0.12261320650577545,"planners":0.42163339257240295,"space":0.2670583128929138,"influence":0.2481963038444519,"automation":0.15374217927455902,"reviews":0.18399551510810852,"ma":0.16901564598083496,"publication":0.38850870728492737,"implemented":0.053558461368083954,"publishers":0.18621283769607544,"reviewed":0.17948302626609802,"links":0.04047965258359909,"brian":0.2492590993642807,"potential":0.2724534869194031,"cities":0.5510454773902893,"offset":0.4098235070705414,"resource":0.22093625366687775,"##ative":0.1652144193649292,"insights":0.006345877889543772,"author":0.1557941734790802,"kind":0.11964982002973557,"##pace":0.5548737645149231,"format":0.1797776222229004,"applicable":0.060564614832401276,"published":0.34457963705062866,"transforming":0.06379228830337524,"tool":0.03174130246043205,"important":0.21945545077323914,"license":0.060539308935403824,"efforts":0.03456439822912216,"##pro":0.2155655473470688,"task":0.2023821622133255,"202":0.22231341898441315,"techniques":0.10463304072618484,"improve":0.04888864606618881,"focused":0.0035941582173109055,"publisher":0.25538837909698486,"topic":0.017722906544804573,"harvard":0.13650839030742645,"facilitate":0.13405866920948029,"code":0.15973183512687683,"##duction":0.2874606251716614,"challenges":0.27279528975486755,"university":0.22209526598453522,"influenced":0.036248043179512024,"scientific":0.10310098528862,"contribute":0.2267485111951828,"link":0.07789286971092224,"##hra":0.30133336782455444,"integrated":0.24239039421081543,"interactions":0.15954171121120453,"##dis":0.11599010229110718,"transform":0.30501848459243774,"database":0.02429979294538498,"computing":0.022582095116376877,"contributor":0.04730186238884926,"paper":0.24984286725521088,"##4":0.05706184357404709,"influences":0.0535680390894413,"studies":0.4529181122779846,"transformed":0.05352449044585228,"department":0.2827862501144409,"value"
:0.4706687927246094,"##ass":0.093976229429245,"applying":0.1453428715467453,"initiative":0.09344621002674103,"nature":0.05899370089173317,"advantage":0.2895694673061371,"implementation":0.030833836644887924,"contributing":0.1328820288181305,"resources":0.12494967132806778,"approaches":0.1485711932182312,"korean":0.03067183494567871,"intelligent":0.2268957644701004,"application":0.2711690068244934,"jessica":0.15071113407611847,"activities":0.10379347205162048,"engage":0.07790189981460571,"interaction":0.0824788436293602,"challenge":0.17710502445697784,"reduction":0.01543586514890194,"timothy":0.14833040535449982,"methodology":0.24421893060207367},"dates":[{"kind":"Publication date","value":"2024-08-01"}],"source":"DSpace@MIT","title":"AI Analytics for Carbon-Neutral City Planning: A Systematic Review of Applications","source_link":"https://dspace.mit.edu/handle/1721.1/157266","content_type":["Article"],"rights":[{"description":"Creative Commons Attribution","kind":"useAndReproduction"}],"publishers":[{"name":"Multidisciplinary Digital Publishing Institute"}],"links":[{"url":"https://hdl.handle.net/1721.1/157266","kind":"Digital object URL","text":"Digital object URL"}],"contributors":[{"value":"Cong, Cong","kind":"author"},{"value":"Page, Jessica","kind":"author"},{"value":"Kwak, Yoonshin","kind":"author"},{"value":"Deal, Brian","kind":"author"},{"value":"Kalantari, Zahra","kind":"author"},{"value":"Massachusetts Institute of Technology. Department of Urban Studies and Planning","kind":"department"}],"timdex_record_id":"dspace:1721.1-157266"},"sort":[9.738817,1722470400000]},{"_index":"dspace-2026-02-09t19-23-02","_id":"dspace:1721.1-162354","_score":9.719293,"_source":{"summary":["This paper evaluates the suitability of Apache Arrow, Parquet, and ORC as formats for subsumption in an analytical DBMS. 
We systematically identify and explore the high-level features that are important to support efficient querying in modern OLAP DBMSs and evaluate the ability of each format to support these features. We find that each format has trade-offs that make it more or less suitable for use as a format in a DBMS and identify opportunities to more holistically co-design a unified in-memory and on-disk data representation. Notably, for certain popular machine learning tasks, none of these formats perform optimally, highlighting significant opportunities for advancing format design. Our hope is that this study can be used as a guide for system developers designing and using these formats, as well as provide the community with directions to pursue for improving these common open formats."],"timdex_provenance":{"source":"dspace","run_date":"2026-04-15","run_id":"a816f3dc-51ac-7e5f-cec8-1086ffc54274_861de409-c771-2e2c-c416-93c81a0885e3","run_record_offset":1356},"languages":["en"],"citation":"Liu, C., Pavlenko, A., Interlandi, M. et al. Data formats in analytical DBMSs: performance trade-offs and future directions. 
The VLDB Journal 34, 30 (2025).","file_formats":["application/pdf"],"identifiers":[{"value":"https://hdl.handle.net/1721.1/162354","kind":"uri"},{"value":"PUBLISHER_CC","kind":"mitlicense"}],"format":"electronic resource","embedding_full_record":{"authored":0.06326000392436981,"##b":0.20966780185699463,"metadata":0.06579314917325974,"##c":0.6906861066818237,"inform":0.032833367586135864,"optimal":0.25377368927001953,"##sume":0.11376846581697464,"##f":0.04081907123327255,"objects":0.1176990494132042,"##i":0.12337058782577515,"##frame":0.03737364336848259,"##l":0.12874270975589752,"##m":0.16260561347007751,"evaluation":0.08071526885032654,"##q":0.10321275144815445,"##s":0.26642757654190063,"java":0.15143220126628876,"identification":0.043341800570487976,"contribution":0.008277256041765213,"##sum":0.3802957832813263,"##ms":0.40456026792526245,"xml":0.232737734913826,"##v":0.20461979508399963,"record":0.34169715642929077,"##x":0.35603439807891846,"##ances":0.07611484080553055,"api":0.10119815170764923,"evaluated":0.0915936604142189,"publishing":0.22853311896324158,"springer":0.3735247254371643,"databases":0.21490338444709778,"using":0.05535360053181648,"#":0.0671033263206482,"ai":0.2987413704395294,"analysis":0.2460346817970276,"version":0.13080008327960968,"science":0.13931459188461304,"domain":0.13361269235610962,"institute":0.246263787150383,"evaluating":0.030079076066613197,"compression":0.12405900657176971,"archery":0.08006305992603302,"object":0.27452918887138367,"appropriate":0.16986873745918274,"@":0.04849283769726753,"sub":0.4643206000328064,"statistical":0.056589290499687195,"access":0.005683362949639559,"document":0.1359955370426178,"##type":0.08002244681119919,"cited":0.2731648087501526,"proven":0.3358120918273926,"##len":0.21029067039489746,"##des":0.199040025472641,"coding":0.05735114589333534,"default":0.07054878771305084,"journal":0.4187624454498291,"citations":0.324516236782074,"135":0.13427986204624176,"systems":0.018171120434999466,"mit":0.53862714767
45605,"supports":0.14593368768692017,"##ries":0.005964689422398806,"attribute":0.07261499762535095,"##ded":0.10541872680187225,"email":0.09692370146512985,"computers":0.06100724637508392,"_":0.24417756497859955,"cc":0.10979542881250381,"34":0.018831733614206314,"ce":0.11975161731243134,"c":0.06920450925827026,"languages":0.3096389174461365,"d":0.023943200707435608,"##hema":0.18194539844989777,"dept":0.05622569099068642,"##able":0.021831020712852478,"ibm":0.12162016332149506,"v":0.41451990604400635,"##lda":0.03236616402864456,"archer":0.11155743896961212,"information":0.08152443170547485,"##ance":0.32611650228500366,"analytic":0.3894529342651367,"db":0.5389628410339355,"open":0.30259403586387634,"supported":0.2776867151260376,"publications":0.028576882556080818,"acceptable":0.05775200575590134,"##re":0.02997703291475773,"language":0.3679327070713043,"run":0.32820576429367065,"source":0.25645890831947327,"anna":0.049309488385915756,"ds":0.5970381498336792,"analytics":0.31938526034355164,"features":0.05942435562610626,"##ac":0.0555298812687397,"##mut":0.012596987187862396,"apache":0.5691919326782227,"##16":0.1906917542219162,"tim":0.5583646297454834,"liu":0.39248210191726685,"ur":0.3615259528160095,"##offs":0.3200936019420624,"programming":0.05730119347572327,"##ap":0.24668924510478973,"par":0.6054246425628662,"oracle":0.23230351507663727,"query":0.38184213638305664,"encoding":0.30492886900901794,"article":0.15887928009033203,"et":0.13222229480743408,"##cb":0.016273783519864082,"##ption":0.112815722823143,"suited":0.03173478692770004,"laboratory":0.05539393797516823,"##tri":0.03185667097568512,"##27":0.028649242594838142,"spaces":0.09074917435646057,"citing":0.17482781410217285,"exchange":0.06908046454191208,"##bm":0.09204327315092087,"support":0.30039894580841064,"vs":0.1490935981273651,"compatibility":0.10008184611797333,"useful":0.05663863569498062,"##cs":0.144036665558815,"que":0.015507410280406475,"formats":0.6839311122894287,"memory":0.26607877016067505,"analytic
al":0.5532273650169373,"sources":0.013308841735124588,"string":0.010156911797821522,"records":0.31750768423080444,"mass":0.07795960456132889,"recording":0.013607144355773926,"learning":0.21895013749599457,"##tp":0.08334968984127045,"representation":0.21843059360980988,"papers":0.06430764496326447,"##da":0.05158985033631325,"##41":0.00327925942838192,"content":0.3480491042137146,"##db":0.10483471304178238,"offs":0.41930633783340454,"1712":0.030306948348879814,"common":0.26655104756355286,"##38":0.010804085992276669,"authorship":0.09669502824544907,"linux":0.04003971815109253,"1718":0.022888846695423126,"1717":0.03181882202625275,"1716":0.0460241474211216,"digital":0.3252891004085541,"cipher":0.033086758106946945,"types":0.06844320893287659,"citation":0.37190183997154236,"##base":0.09430906176567078,"perform":0.11816409975290298,"##51":0.13388793170452118,"futures":0.0923713892698288,"##52":0.10562259703874588,"##53":0.005340913776308298,"##54":0.21940243244171143,"##de":0.5519673228263855,"##off":0.3553139865398407,"1722":0.08510658890008926,"1721":0.41685453057289124,"artificial":0.33655256032943726,"##46":0.014451919123530388,"pdf":0.3317619860172272,"what":0.06326655298471451,"publish":0.12108848989009857,"analyst":0.05538155511021614,"syntax":0.028879454359412193,"suitable":0.35854843258857727,"developer":0.10991670191287994,"relational":0.10851946473121643,"contributors":0.13800233602523804,"hd":0.044886454939842224,"pub":0.009274170733988285,"articles":0.015706103295087814,"86":0.026575099676847458,"applications":0.05275992676615715,"1724":0.028561556711792946,"copyright":0.108967125415802,"software":0.07586667686700821,"##wei":0.14451885223388672,"advanced":0.05741257965564728,"developers":0.004118142183870077,"prefix":0.025027096271514893,"zhang":0.08246918767690659,"type":0.2349967658519745,"repository":0.05742449313402176,"improved":0.09223189204931259,"number":0.009914202615618706,"##ifier":0.11010026186704636,"compatible":0.06838491559028625,"##listic":0.
15535415709018707,"advances":0.03609071299433708,"massachusetts":0.44629615545272827,"id":0.4051918387413025,"text":0.0260288305580616,"##nse":0.11344064772129059,"efficiency":0.135295569896698,"python":0.011614164337515831,"##lice":0.16007159650325775,"inter":0.4060518741607666,"handle":0.1578368991613388,"journals":0.15433081984519958,"heidelberg":0.11487074196338654,"script":0.024793172255158424,"intelligence":0.27145013213157654,"1624":0.07035279273986816,"1623":0.33481156826019287,"filing":0.0728340819478035,"matteo":0.3645545244216919,"system":0.12195334583520889,"issn":0.012653990648686886,"anal":0.16608324646949768,"analyze":0.06071585416793823,"binary":0.006361054256558418,"suit":0.3951907157897949,"evaluate":0.21086925268173218,"hash":0.0017435505287721753,"authors":0.10221445560455322,"trading":0.3173046410083771,"server":0.1242666020989418,"semantic":0.022489970549941063,"extension":0.016913605853915215,"1086":0.09457282721996307,"commons":0.2575511336326599,"computer":0.2724320590496063,"file":0.4406164586544037,"bibliography":0.03022458404302597,"modern":0.13668183982372284,"feature":0.07021725922822952,"web":0.02617386169731617,"rights":0.09366274625062943,"electronic":0.2340630292892456,"##ability":0.1801607459783554,"berlin":0.24757257103919983,"##bution":0.06591100245714188,"##ifiers":0.07684125751256943,"efficient":0.28193122148513794,"off":0.3288807272911072,"framework":0.13764390349388123,"##ent":0.05290812626481056,"future":0.4778751730918884,"machine":0.3194677233695984,"unified":0.23386123776435852,"stored":0.08578113466501236,"yong":0.03955918177962303,"cite":0.33382564783096313,"php":0.26280125975608826,"statistics":0.019855445250868797,"date":0.3127308487892151,"data":0.7685121297836304,"arrow":0.772948682308197,"use":0.288200706243515,"arrows":0.5317402482032776,"used":0.23208676278591156,"integer":0.03136451914906502,"suits":0.13321034610271454,"space":0.2351044863462448,"chun":0.20622095465660095,"reference":0.017940489575266838,"##land
":0.3995470106601715,"protocol":0.11519325524568558,"brandon":0.36556828022003174,"ma":0.050216853618621826,"publication":0.327789843082428,"host":0.21660538017749786,"publishers":0.14939634501934052,"links":0.08115195482969284,"tag":0.042355939745903015,"##ix":0.06601136177778244,"##que":0.01914374530315399,"development":0.06831243634223938,"offset":0.4688059985637665,"resource":0.2971538305282593,"kind":0.30223211646080017,"author":0.11289648711681366,"format":0.7642186284065247,"##pace":0.5418577194213867,"applicable":0.05221707001328468,"published":0.2798413634300232,"license":0.07024329900741577,"disk":0.27597349882125854,"##pro":0.15400145947933197,"directions":0.2734294533729553,"202":0.19610534608364105,"improve":0.11574501544237137,"files":0.29914751648902893,"publisher":0.29015883803367615,"header":0.05922859162092209,"code":0.17266401648521423,"##duction":0.295329749584198,"scala":0.03923822194337845,"university":0.07478907704353333,"##ducted":0.02141270413994789,"values":0.09246232360601425,"##ld":0.472296804189682,"sql":0.3778570294380188,"database":0.5726172924041748,"computing":0.09924035519361496,"contributor":0.08859466016292572,"##ko":0.21147622168064117,"paper":0.16685697436332703,"design":0.24472486972808838,"browser":0.001083766808733344,"##8":0.0796188935637474,"og":0.046550996601581573,"department":0.04782227426767349,"value":0.5165772438049316,"ol":0.4314623177051544,"##ass":0.011737906374037266,"or":1.2697066068649292,"sap":0.13873858749866486,"traded":0.13100340962409973,"performing":0.05869215726852417,"##quet":0.42965054512023926,"trader":0.06325112283229828,"trades":0.3118123710155487,"resources":0.13070796430110931,"pa":0.28829145431518555,"trade":0.61690354347229,"performance":0.49630552530288696,"application":0.2254633605480194,"##ls":0.10663583129644394,"variable":0.20136728882789612,"compliant":0.14644505083560944,"cheng":0.009740360081195831,"haynes":0.3956882059574127,"timothy":0.14257872104644775},"dates":[{"kind":"Publication 
date","value":"2025-03-19"}],"source":"DSpace@MIT","title":"Data formats in analytical DBMSs: performance trade-offs and future directions","related_items":[{"description":"The VLDB Journal","relationship":"host"}],"source_link":"https://dspace.mit.edu/handle/1721.1/162354","content_type":["Article"],"rights":[{"description":"Creative Commons Attribution","kind":"useAndReproduction"}],"publishers":[{"name":"Springer Berlin Heidelberg"}],"links":[{"url":"https://hdl.handle.net/1721.1/162354","kind":"Digital object URL","text":"Digital object URL"}],"contributors":[{"value":"Liu, Chunwei","kind":"author"},{"value":"Pavlenko, Anna","kind":"author"},{"value":"Interlandi, Matteo","kind":"author"},{"value":"Haynes, Brandon","kind":"author"},{"value":"Massachusetts Institute of Technology. Computer Science and Artificial Intelligence Laboratory","kind":"department"}],"timdex_record_id":"dspace:1721.1-162354"},"sort":[9.719293,1742342400000]},{"_index":"dspace-2026-02-09t19-23-02","_id":"dspace:1721.1-165230","_score":9.7108345,"_source":{"summary":["Flight phase identification (FPI) approaches that\r\napply traditional machine learning techniques are expensive to\r\nscale, difficult to generalize across platforms, and frequently\r\nunavailable in permissive or distributed training environments.\r\nWe propose a scalable, data-driven pipeline for automatic FPI\r\nusing open-source Automatic Dependent Surveillance-Broadcast\r\n(ADS-B) data, with an emphasis on cross-aircraft generalization\r\nthrough transfer learning. Leveraging ADS-B telemetry from\r\nUSAF Initial Flight Training aircraft, a neural network classifier\r\nis trained on Diamond DA-20 flight data and evaluated on Texan\r\nT-6 aircraft under zero-shot and fine-tuned transfer learning\r\nconditions. 
We describe a robust ADS-B preprocessing pipeline\r\nintegrating digital elevation model (DEM) data, a data labeling\r\nstrategy using unsupervised learning, and a transfer learning\r\napproach enabling adaptation across aircraft types with limited\r\nlabeled data. Our results demonstrate that transfer learning significantly\r\nimproves classification accuracy for flight phases with\r\nlimited data, highlighting the potential of ADS-B-based models\r\nto support scalable, behavior-aware airspace intelligence across\r\nheterogeneous fleets and permissive environments. This research\r\nadvances FPI capabilities for USAF training analysis and broader\r\noperational priorities in autonomy, situational awareness, and\r\ndata-driven decision support."],"timdex_provenance":{"source":"dspace","run_date":"2026-03-22","run_id":"f15b82c8-9c33-adb1-ef33-e3b19b0bee5a_749ee42b-ec50-9cc8-37ee-e235b3bcffa1","run_record_offset":3},"languages":["en_US"],"citation":"Kiefer, Jacob, Alemany, Sheila (2026-03-20): Cross-Aircraft Flight Phase Classification Using ADS-B Data and Transfer Learning. Technical Report. 
https://dspace.mit.edu/handle/1721.1/165230","file_formats":["application/pdf"],"identifiers":[{"value":"https://hdl.handle.net/1721.1/165230","kind":"uri"}],"subjects":[{"value":["ADS-B, flight phase detection, trajectory analysis, transfer learning, aviation analytics"],"kind":"Subject scheme not provided"}],"format":"electronic resource","embedding_full_record":{"plane":0.327323317527771,"##b":0.37748393416404724,"##f":0.18324199318885803,"objects":0.07714032381772995,"accuracy":0.3802049458026886,"texas":0.2624126076698303,"##frame":0.2078765481710434,"dem":0.3664191961288452,"analyzing":0.056507814675569534,"##q":0.029153112322092056,"##r":0.04934535548090935,"raf":0.1800212562084198,"retrieval":0.10364896059036255,"record":0.0847080796957016,"##x":0.17942027747631073,"tel":0.3122199475765228,"##ances":2.1301886590663344E-4,"knowledge":0.04317100718617439,"ad":0.41872575879096985,"af":0.11162019520998001,"tex":0.15814034640789032,"ai":0.23098541796207428,"analysis":0.3636189103126526,"-":0.2677155137062073,"adapted":0.11326386779546738,"airport":0.2887551784515381,"0":0.010377583093941212,"av":0.3121824562549591,"mcdonnell":0.018141737207770348,"##hawk":0.07721666246652603,"agile":0.10476768016815186,"wing":0.07906606793403625,"bombers":0.08238886296749115,"object":0.21176591515541077,"flight":0.8271450996398926,"statistical":0.1512524038553238,"scheme":0.2029295116662979,"cited":0.09120924025774002,"proven":0.2575123608112335,"adaptive":0.24886831641197205,"coding":0.03778305649757385,"capability":0.28460946679115295,"citations":0.24943473935127258,"acquisition":0.06868216395378113,"behavior":0.17540597915649414,"enabling":0.01905832067131996,"b":0.7945021390914917,"##train":0.1418839991092682,"learn":0.4231948256492615,"f":0.821062445640564,"##sonic":0.08698060363531113,"fly":0.29634159803390503,"r":0.2454063445329666,"##grate":0.10458781570196152,"stage":0.13219870626926422,"information":0.07304446399211884,"##ance":0.32310885190963745,"aerospace":0.29311108
589172363,"##izations":0.0012437861878424883,"da":0.20922498404979706,"analytic":0.07734008133411407,"fleet":0.26504266262054443,"transferred":0.2986842095851898,"deco":0.05213594809174538,"language":0.20246359705924988,"lincolnshire":0.0593637079000473,"f1":0.23575718700885773,"ds":0.5071855783462524,"analytics":0.3400990962982178,"tim":0.4548512101173401,"airlines":0.2345527857542038,"train":0.1652452051639557,"computational":0.032296307384967804,"##try":0.15804250538349152,"aviator":0.1210118979215622,"planes":0.2757224142551422,"gps":0.033663246780633926,"encoding":0.12445726990699768,"ads":0.6522861123085022,"learnt":0.009058349765837193,"##tra":0.05399373918771744,"identifying":0.33007922768592834,"formats":0.05401812866330147,"neural":0.3721093237400055,"##pis":0.3450034558773041,"trained":0.26436060667037964,"technical":0.2027466744184494,"analytical":0.02548176795244217,"fl":0.011340937577188015,"training":0.5586438179016113,"fleets":0.07841381430625916,"capable":0.010757355950772762,"jets":0.09156147390604019,"##da":0.032988663762807846,"flown":0.07128415256738663,"transferring":0.5048041939735413,"##lab":0.07078082859516144,"behavioral":0.14552803337574005,"trainer":0.0024121811147779226,"surveillance":0.4074339270591736,"airline":0.1849549263715744,"afb":0.1493145376443863,"class":0.1879206746816635,"digital":0.4256141483783722,"capabilities":0.3105522394180298,"pilot":0.238252192735672,"identify":0.38165828585624695,"citation":0.32510140538215637,"label":0.17522859573364258,"trajectory":0.2638624310493469,"##ed":0.01922573894262314,"##de":0.4000800848007202,"horizon":0.0015272091841325164,"pdf":0.20143234729766846,"regression":0.13863980770111084,"airplane":0.3339555859565735,"analyst":0.07570115476846695,"detected":0.025865908712148666,"hd":0.06436578184366226,"##eous":0.05534256994724274,"##man":0.09181712567806244,"##ble":0.22314807772636414,"simulation":0.16747212409973145,"approach":0.32134249806404114,"tracking":0.1743800789117813,"crosses":0.1707
4596881866455,"nad":0.02006673254072666,"##ifier":0.26231440901756287,"navigation":0.11452538520097733,"##elli":0.01952385902404785,"imagery":0.05108343064785004,"model":0.3343983292579651,"id":0.38156795501708984,"per":0.2228415608406067,"nap":0.08270581066608429,"##missive":0.3779456615447998,"algorithm":0.19287234544754028,"sky":0.03536292538046837,"dependency":4.842617781832814E-4,"##aging":0.050706710666418076,"distributed":0.19617734849452972,"classified":0.2424139529466629,"handle":0.04359809309244156,"schemes":0.11856938898563385,"##ache":0.08581281453371048,"classification":0.5773466229438782,"crossing":0.34570860862731934,"propose":0.07769981026649475,"intelligence":0.40255168080329895,"broadcasting":0.12064145505428314,"traditional":0.15516391396522522,"analyze":0.08002284914255142,"driven":0.2707163691520691,"##ogen":0.14492687582969666,"crossed":0.34581229090690613,"algorithms":0.1989930421113968,"##gy":0.12164152413606644,"##per":0.10839126259088516,"drones":0.11529263108968735,"inference":0.037696413695812225,"air":0.31766703724861145,"##ization":0.16827194392681122,"aero":0.20904149115085602,"cycle":0.06794340163469315,"##gration":0.22000053524971008,"file":0.16187220811843872,"electronic":0.07864823937416077,"ki":0.36999744176864624,"robust":0.26237091422080994,"radar":0.3276538848876953,"machine":0.38167062401771545,"report":0.1758248209953308,"cite":0.17992758750915527,"##ration":0.09714525938034058,"codes":0.05214240029454231,"auto":0.16973452270030975,"environments":0.009488009847700596,"recognition":0.1538490355014801,"detectors":0.2597590982913971,"autonomous":0.26216644048690796,"lab":0.010193179361522198,"platforms":0.13332928717136383,"##aer":0.007053046021610498,"automation":0.24649544060230255,"fine":0.006917104125022888,"publication":0.21779265999794006,"ale":0.20102186501026154,"traffic":0.031102513894438744,"##ix":0.00157483434304595,"pilots":0.2885487377643585,"##eme":0.16557927429676056,"difficult":0.08893875032663345,"runway":0.0671
3844835758209,"lever":0.26676419377326965,"tool":0.05721225589513779,"coded":0.08440535515546799,"202":0.11387988179922104,"sensor":0.1148727759718895,"ni":0.009924238547682762,"detector":0.19064894318580627,"nl":0.0774017721414566,"##grating":0.17746390402317047,"leverage":0.02625182829797268,"code":0.1661587506532669,"ns":0.07815902680158615,"university":0.02989606186747551,"nu":0.0788736641407013,"technique":0.1803264170885086,"airborne":0.18447354435920715,"##ach":0.22893689572811127,"##bee":0.21813255548477173,"elevation":0.4510262906551361,"simulator":0.13531850278377533,"havilland":0.0652073547244072,"aircraft":0.665353000164032,"cross":0.7417284250259399,"automatic":0.3135499954223633,"##fly":0.022322554141283035,"application":0.14105579257011414,"tuned":0.1316758692264557,"adaptations":0.021747155115008354,"ames":0.006603383459150791,"pi":0.28047317266464233,"machines":0.01250362116843462,"##set":0.07410489022731781,"incident":0.03945603594183922,"accurate":0.29881006479263306,"depend":0.02014412172138691,"adaptation":0.1707857996225357,"echo":0.06648745387792587,"##ces":0.02262932062149048,"identification":0.5200278162956238,"##hot":0.08714259415864944,"prep":0.3260059952735901,"models":0.2482084482908249,"based":0.2405795305967331,"using":0.09748149663209915,"##naut":0.04948049783706665,"monitoring":0.049851834774017334,"airspace":0.5116061568260193,"labels":0.07254334539175034,"20":0.003619598224759102,"crossover":0.23050493001937866,"automatically":0.20638541877269745,"experiments":0.004495156928896904,"##pi":0.6445677280426025,"mig":0.05900212377309799,"##des":0.09368448704481125,"networks":0.08373016864061356,"kei":0.10064035654067993,"mit":0.46582409739494324,"situation":0.08368326723575592,"##version":0.17950744926929474,"detection":0.4346212148666382,"languages":0.13573890924453735,"decision":0.11253432929515839,"airplanes":0.2983308732509613,"simulations":0.04014856368303299,"##01":0.05685464292764664,"automated":0.32081496715545654,"lincoln":0.53
53744626045227,"##pu":0.13256913423538208,"##efe":0.2113998830318451,"open":0.11679860949516296,"##ind":0.06381805986166,"tx":0.057043932378292084,"##shot":0.07646559178829193,"project":0.05300106108188629,"run":0.0333317331969738,"source":0.18904349207878113,"##ro":0.019282620400190353,"research":0.29766589403152466,"##21":0.009631079621613026,"zero":0.39043471217155457,"##cal":0.05109814926981926,"aeronautics":0.33473819494247437,"awareness":0.18369989097118378,"segment":0.015970800071954727,"jet":0.17622223496437073,"##19":0.044592346996068954,"military":0.33383557200431824,"aeronautical":0.2691512405872345,"##imi":0.19553236663341522,"ur":0.09375284612178802,"adapt":0.06748977303504944,"labeled":0.052534278482198715,"boeing":0.0757812112569809,"drone":0.051251549273729324,"technologies":0.014744002372026443,"laboratory":0.11841476708650589,"flying":0.30850717425346375,"detecting":0.04603651165962219,"demonstrate":0.01975083164870739,"support":0.10472959280014038,"##ffa":0.011855383403599262,"##ila":0.11677130311727524,"##te":0.03668559342622757,"records":0.0062113613821566105,"sheila":0.2550453245639801,"detect":0.2577579915523529,"learning":0.6050947904586792,"shot":0.18479858338832855,"##33":0.0844298005104065,"##34":0.054386645555496216,"##su":0.14862100780010223,"##ight":0.009235979057848454,"##38":0.0652979388833046,"jacob":0.3383141756057739,"##ta":0.06809775531291962,"summary":0.015219010412693024,"learned":0.2585221827030182,"airfield":0.11853575706481934,"##51":0.04587308689951897,"1721":0.30355650186538696,"artificial":0.16651064157485962,"applications":0.014015867374837399,"##nte":0.17380225658416748,"modeling":0.17204919457435608,"software":0.10647904127836227,"faa":0.3823120892047882,"multi":0.11063821613788605,"identified":0.29891395568847656,"enable":0.009346500970423222,"dependent":0.3506503403186798,"phase":0.6809138059616089,"identifies":0.14408521354198456,"method":0.13752584159374237,"classifications":0.2815910875797272,"##sing":0.24703679978
847504,"force":0.211165651679039,"##cross":0.16277183592319489,"broadcast":0.31152406334877014,"methods":0.17136423289775848,"interceptor":0.020217256620526314,"phased":0.38362130522727966,"across":0.33647629618644714,"computer":0.007607245817780495,"transfers":0.3608941435813904,"labeling":0.27069777250289917,"identity":0.21566705405712128,"phases":0.5601584911346436,"cockpit":0.10423694550991058,"##ifiers":0.05209611728787422,"initial":0.2172650545835495,"pipeline":0.4802693724632263,"nasa":0.2520968019962311,"usaf":0.37407612800598145,"airbus":0.10812097787857056,"queue":0.008187898434698582,"statistics":0.0856262594461441,"date":0.07258779555559158,"diamonds":0.28526124358177185,"data":0.6807225346565247,"broadcaster":0.08821972459554672,"navy":0.001447769463993609,"nun":0.10145047307014465,"aviation":0.6543870568275452,"space":0.08886734396219254,"cloud":0.017315048724412918,"##ava":0.18706026673316956,"protocol":0.030212752521038055,"1653":0.0998312458395958,"1652":0.35583817958831787,"tag":0.0776335671544075,"potential":0.17087379097938538,"offset":0.3747822046279907,"##flight":0.31471872329711914,"resource":0.2071581333875656,"kind":0.025950495153665543,"##pace":0.45429569482803345,"format":0.10158206522464752,"published":0.17788740992546082,"##ition":0.027097929269075394,"transfer":0.7678554058074951,"##pro":0.07810728251934052,"proposed":0.02172822691500187,"techniques":0.25671204924583435,"classify":0.3323252499103546,"altitude":0.04957279935479164,"scala":0.45722994208335876,"platform":0.1886875480413437,"##oop":0.01893220655620098,"network":0.24493859708309174,"aware":0.1938502937555313,"##rove":0.13063780963420868,"lockheed":0.0876787006855011,"general":0.1439075767993927,"database":0.2651844918727875,"computing":0.015329546295106411,"##2":0.009317763149738312,"value":0.37326744198799133,"sap":0.07409115880727768,"cost":0.003585290629416704,"implementation":0.03449702635407448,"resources":0.028323328122496605,"approaches":0.32322704792022705,"diamond":
0.5509471893310547,"stages":0.08748873323202133,"##ond":0.07797770947217941,"flights":0.4816899001598358,"methodology":0.09708613902330399},"dates":[{"kind":"Publication date","value":"2026-03-20"}],"source":"DSpace@MIT","title":"Cross-Aircraft Flight Phase Classification Using ADS-B Data and Transfer Learning","source_link":"https://dspace.mit.edu/handle/1721.1/165230","content_type":["Technical Report"],"links":[{"url":"https://hdl.handle.net/1721.1/165230","kind":"Digital object URL","text":"Digital object URL"}],"contributors":[{"value":"Kiefer, Jacob","kind":"author"},{"value":"Alemany, Sheila","kind":"author"},{"value":"Lincoln Laboratory","kind":"department"}],"timdex_record_id":"dspace:1721.1-165230"},"sort":[9.7108345,1773964800000]},{"_index":"dspace-2026-02-09t19-23-02","_id":"dspace:1721.1-162482","_score":9.66168,"_source":{"summary":["Automation and digitalization solutions in the field of small molecule synthesis face new challenges for chemical reaction analysis, especially in the field of high-performance liquid chromatography (HPLC). Chromatographic data remains locked in vendors' hardware and software components, limiting their potential in automated workflows and data science applications. In this work, we present an open-source Python project called MOCCA for the analysis of HPLC-DAD (photodiode array detector) raw data. MOCCA provides a comprehensive set of data analysis features, including an automated peak deconvolution routine of known signals, even if overlapped with signals of unexpected impurities or side products. 
We highlight the broad applicability of MOCCA in four studies: (i) a simulation study to validate MOCCA's data analysis features; (ii) a reaction kinetics study on a Knoevenagel condensation reaction demonstrating MOCCA's peak deconvolution feature; (iii) a closed-loop optimization study for the alkylation of 2-pyridone without human control during data analysis; (iv) a well plate screening of categorical reaction parameters for a novel palladium-catalyzed cyanation of aryl halides employing <i>O</i>-protected cyanohydrins. By publishing MOCCA as a Python package with this work, we envision an open-source community project for chromatographic data analysis with the potential of further advancing its scope and capabilities."],"timdex_provenance":{"source":"dspace","run_date":"2026-04-15","run_id":"a816f3dc-51ac-7e5f-cec8-1086ffc54274_861de409-c771-2e2c-c416-93c81a0885e3","run_record_offset":649},"languages":["en"],"citation":"Christian P. Haas, Maximilian Lübbesmeyer, Edward H. Jin, Matthew A. McDonald, Brent A. Koscher, Nicolas Guimond, Laura Di Rocco, Henning Kayser, Samuel Leweke, Sebastian Niedenführ, Rachel Nicholls, Emily Greeves, David M. Barber, Julius Hillenbrand, Giulio Volpin, and Klavs F. Jensen. 
ACS Central Science 2023 9 (2), 307-317.","file_formats":["application/pdf"],"identifiers":[{"value":"https://hdl.handle.net/1721.1/162482","kind":"uri"}],"format":"electronic resource","embedding_full_record":{"projects":0.10914545506238937,"optimal":0.08823083341121674,"##pins":0.023971229791641235,"##f":0.175813227891922,"objects":0.06735728681087494,"##i":0.0728113204240799,"liquids":0.10222774744033813,"##l":0.12143011391162872,"edwards":0.03290974348783493,"##n":0.1799146831035614,"analyzing":0.28946569561958313,"contributions":0.028890028595924377,"protected":0.27407389879226685,"screenings":0.2366718351840973,"record":0.1810608059167862,"##x":0.2180076241493225,"sci":0.049914635717868805,"scanner":0.002025132067501545,"##ances":0.0249042846262455,"ac":0.3154393434524536,"conde":0.32536041736602783,"raw":0.46547985076904297,"engineers":0.173634335398674,"al":0.33079180121421814,"analysis":0.5809611678123474,"community":0.17876774072647095,"packages":0.08731857687234879,"-":0.08258605003356934,"synthesized":0.07469440996646881,"ar":0.36741769313812256,"##graphy":0.22839364409446716,"chemical":0.5671109557151794,"science":0.2770434021949768,"domain":0.004288491327315569,"institute":0.32594114542007446,"object":0.24659587442874908,"peaking":0.11280077695846558,"@":0.10152069479227066,"spectra":0.09949986636638641,"statistical":0.06665483117103577,"##creen":0.09181294590234756,"molecules":0.29625046253204346,"cited":0.2676732540130615,"proven":0.2753150165081024,"##idium":0.07159323245286942,"citations":0.3429619371891022,"journal":0.1316508650779724,"##lization":0.015602322295308113,"##flow":0.16889040172100067,"_":0.050028759986162186,"chemistry":0.468561053276062,"ce":0.10143879055976868,"ch":0.4665687382221222,"h":0.03473366051912308,"photo":0.3831898868083954,"loops":0.08921335637569427,"cl":0.047037139534950256,"k":0.023455945774912834,"sample":0.055150341242551804,"p":0.20189863443374634,"jens":0.11967834830284119,"r":0.008775603957474232,"cy":0.3232453167
438507,"information":0.0017366603715345263,"##ance":0.313345342874527,"##ano":0.3038313686847687,"analytic":0.20648744702339172,"characterization":0.025275837630033493,"novel":0.12328917533159256,"publications":0.07713576406240463,"screening":0.4678918123245239,"deco":0.4347671866416931,"di":0.13694249093532562,"##mes":0.02136147767305374,"##ane":0.01183395367115736,"language":0.25979164242744446,"##ana":0.2164652794599533,"developed":0.038301046937704086,"##rom":0.4352356195449829,"ds":0.5241784453392029,"analytics":0.2950293719768524,"analyses":0.06947588920593262,"##ac":0.10234133154153824,"tim":0.5121236443519592,"pal":0.3841400146484375,"signal":0.21217501163482666,"vendors":0.14770282804965973,"digit":0.1982204020023346,"computational":0.040227510035037994,"che":0.08055594563484192,"##anal":0.12874624133110046,"##ca":0.2468983381986618,"article":0.18027426302433014,"##aly":0.2362266629934311,"wiley":0.057154327630996704,"catalyst":0.0979207307100296,"##lav":0.28234174847602844,"formats":0.13892312347888947,"analytical":0.25842079520225525,"sources":0.10472097992897034,"decomposition":0.023595452308654785,"##pin":0.2600592076778412,"title":0.10982571542263031,"##ning":0.28290867805480957,"content":0.14512842893600464,"##cc":0.09712677448987961,"##lad":0.15209650993347168,"vol":0.4058322012424469,"society":0.13537825644016266,"##lab":0.20663794875144958,"spectroscopy":0.2505006194114685,"sourced":0.13143211603164673,"authorship":0.16396041214466095,"scope":0.14659304916858673,"##enstein":0.006050649099051952,"molecular":0.2767097055912018,"digital":0.5312503576278687,"##trom":0.16334766149520874,"maximilian":0.3867592513561249,"gi":0.15722891688346863,"capabilities":0.05089449882507324,"citation":0.40332597494125366,"peak":0.6162130236625671,"gr":0.13708975911140442,"##de":0.505196750164032,"pdf":0.26623404026031494,"berkeley":0.016726253554224968,"publish":0.1102289929986,"##chrome":0.08514109253883362,"analyst":0.2618616223335266,"well":0.2102104276418686,"con
tributors":0.16998876631259918,"hd":0.02340606600046158,"comprehensive":0.04589812830090523,"##dr":0.28509756922721863,"copyright":0.12353650480508804,"##oes":7.9118408029899E-4,"advanced":0.01678680069744587,"simulation":0.2730439305305481,"hp":0.590685248374939,"##llation":0.03223777562379837,"##fc":0.07987811416387558,"##ee":0.31010106205940247,"number":0.05173585191369057,"##ifier":0.09576612710952759,"##egorical":0.17738132178783417,"dna":0.17516329884529114,"##eyer":0.12665165960788727,"##en":0.25548887252807617,"##metric":0.05193796008825302,"id":0.29377222061157227,"text":0.007275140844285488,"validation":0.04211266338825226,"flow":0.019900869578123093,"algorithm":0.169870063662529,"python":0.6159080862998962,"plates":0.17928555607795715,"testing":0.03925369307398796,"handle":0.058197032660245895,"peaks":0.4017167389392853,"script":0.13071738183498383,"##ode":0.06055004522204399,"bosch":0.05950118228793144,"field":0.08493354171514511,"anal":0.25034642219543457,"analyze":0.335516095161438,"opens":0.20825044810771942,"gui":0.369405597448349,"arrays":0.20244726538658142,"authors":0.18514612317085266,"algorithms":0.13643108308315277,"##idon":0.24074862897396088,"##urity":0.04096322879195213,"plate":0.3375162184238434,"1086":0.08064723014831543,"##ization":0.22635126113891602,"valid":0.16142308712005615,"file":0.256416916847229,"bibliography":0.006614206358790398,"electronic":0.19632962346076965,"synthesis":0.33114373683929443,"##age":0.32881250977516174,"##hy":0.3027333617210388,"product":0.010623679496347904,"kn":0.3498324155807495,"ko":0.3548291325569153,"helmut":0.10421184450387955,"techno":0.004487012512981892,"nichols":0.07196025550365448,"##analysis":0.1691296249628067,"peek":0.014557001180946827,"overlapping":0.09740683436393738,"machine":0.01115298829972744,"cite":0.353221595287323,"##hr":0.11316099017858505,"307":0.024804839864373207,"##ration":0.01198144443333149,"kinetic":0.34045249223709106,"screened":0.1724023073911667,"fontaine":0.02214328199625015
3,"auto":0.14873544871807098,"##ene":0.06518734246492386,"##vos":0.05512682721018791,"use":0.0781911164522171,"screen":0.3769725561141968,"edward":0.23299692571163177,"detectors":0.41270679235458374,"lab":0.07544619590044022,"photos":0.14586840569972992,"##aer":0.04058179259300232,"##bility":0.03675847128033638,"automation":0.5323476791381836,"solution":0.2141130119562149,"publication":0.35873091220855713,"host":0.09491993486881256,"chloride":0.08415001630783081,"links":0.054402898997068405,"locked":0.3369487524032593,"##ium":0.27187803387641907,"phosphorus":0.07392706722021103,"##ix":0.06535351276397705,"matthew":0.17563612759113312,"##metry":0.0635732039809227,"mo":0.8616673350334167,"author":0.28085172176361084,"tool":0.1194043755531311,"synth":0.18927060067653656,"202":0.10471870005130768,"catalytic":0.14523141086101532,"sensor":0.10847824066877365,"ni":0.33609509468078613,"detector":0.4078851044178009,"harvard":0.07861283421516418,"code":0.23152166604995728,"patent":0.001837418763898313,"university":0.18393708765506744,"##lc":0.42467308044433594,"##dio":0.26785415410995483,"department":0.26675423979759216,"##eki":0.029474448412656784,"##ky":0.25890693068504333,"chemist":0.10198456048965454,"##eke":0.20598115026950836,"kay":0.34893858432769775,"simulator":0.06322409212589264,"##screen":0.06487827003002167,"automatic":0.14141277968883514,"control":0.001406440045684576,"compound":0.051112182438373566,"probe":0.11902287602424622,"##yre":0.03887487202882767,"application":0.19145192205905914,"##lu":0.10729756951332092,"##graph":0.26395654678344727,"##ser":0.2749210298061371,"authored":0.14071188867092133,"##ometer":0.030127130448818207,"##urities":0.18811866641044617,"sequencing":0.04717058688402176,"contribution":0.12509655952453613,"##hot":0.06713119149208069,"api":0.06208544597029686,"chemicals":0.269120454788208,"publishing":0.2432117760181427,"lew":0.2440883219242096,"app":0.10448767989873886,"nicholas":0.2155216932296753,"##oe":0.2717418074607849,"sebastian":0.
27399933338165283,"##ns":0.1758842021226883,"perrin":0.017750147730112076,"processing":0.01012483797967434,"molecule":0.331489622592926,"##bbe":0.23803015053272247,"##sch":0.07848741859197617,"experiments":0.141098752617836,"automatically":0.10355868935585022,"##meter":0.08155610412359238,"##des":0.11333120614290237,"jensen":0.49234700202941895,"mcdonald":0.46689724922180176,"routine":0.04860897734761238,"sg":0.02304757758975029,"##ation":0.16072390973567963,"christian":0.37477585673332214,"vendor":0.3030058741569519,"purification":0.10767142474651337,"mit":0.48413512110710144,"samuel":0.3479236662387848,"##cca":0.531439483165741,"detection":0.2987443506717682,"reaction":0.6315406560897827,"languages":0.1758996993303299,"dept":0.19729290902614594,"simulations":0.15985120832920074,"##ins":0.07848533242940903,"##00":0.07465515285730362,"controlled":0.004284488502889872,"hill":0.2559320628643036,"##sche":0.1851508915424347,"##01":0.17352838814258575,"automated":0.48101645708084106,"rachel":0.30173489451408386,"closed":0.23974910378456116,"reactions":0.5091637372970581,"open":0.6784471273422241,"##re":0.07669492065906525,"project":0.4932900667190552,"run":0.1954246312379837,"source":0.5131348371505737,"##ees":0.09412546455860138,"challenging":0.032937124371528625,"research":0.06172395497560501,"##lysis":0.011948872357606888,"##21":0.004732798784971237,"sciences":0.010372467339038849,"features":0.12870627641677856,"reacts":0.08676116168498993,"hal":0.3608855605125427,"##16":0.14915157854557037,"neutron":0.06880778074264526,"loop":0.3138979375362396,"cambridge":0.056028418242931366,"##imi":0.30685871839523315,"ur":0.2976837754249573,"tech":0.02262232080101967,"solutions":0.23897676169872284,"mole":0.2982817590236664,"##tion":0.1973220854997635,"##sm":0.13273099064826965,"engineering":0.36624401807785034,"##ating":0.023260729387402534,"technologies":0.03530821576714516,"##ides":0.08593841642141342,"reactive":0.27319541573524475,"overlap":0.22571603953838348,"signals":0.221
6399908065796,"laboratory":0.06977687776088715,"##27":0.01861575059592724,"##ede":0.2400558590888977,"##tions":0.06306760758161545,"citing":0.135920450091362,"##ves":0.25780409574508667,"##mate":0.06864428520202637,"parameters":0.1944338083267212,"64":0.0031260382384061813,"##ven":0.20707806944847107,"analysts":0.12954162061214447,"records":0.100505031645298,"scientist":0.04187177121639252,"mass":0.03442668169736862,"father":0.009606107138097286,"rocco":0.32151445746421814,"detect":0.16543623805046082,"##40":0.03574544936418533,"##41":0.055289458483457565,"central":0.4225306808948517,"linux":0.05836924910545349,"haas":0.5348629951477051,"1717":0.0218258835375309,"1716":0.011376316659152508,"summary":0.023603888228535652,"##mond":0.1906675100326538,"locking":0.02884717471897602,"technology":0.09097210317850113,"##51":0.04084926098585129,"engineer":0.20022691786289215,"1722":0.061175230890512466,"1721":0.4015094041824341,"applications":0.2020692676305771,"brent":0.17624899744987488,"software":0.49674707651138306,"##vo":0.300221711397171,"react":0.33801698684692383,"program":0.15005458891391754,"repository":0.09972896426916122,"##vs":0.016362613067030907,"jin":0.28682658076286316,"hen":0.4753245711326599,"optimization":0.4308759272098541,"nicolas":0.3170417547225952,"massachusetts":0.4365416169166565,"1618":0.009568927809596062,"instrumentation":0.006470929365605116,"hardware":0.1447049230337143,"##lica":0.15368923544883728,"julius":0.3188163638114929,"method":0.07506859302520752,"simulated":0.005866598337888718,"##tech":0.19263190031051636,"1624":0.36339178681373596,"valuable":0.10494717210531235,"study":0.18275956809520721,"methods":0.06692494451999664,"##hes":0.03186068311333656,"cobalt":0.052701614797115326,"isotope":0.15622766315937042,"tools":0.07252149283885956,"commons":0.2436729073524475,"nick":0.1590053290128708,"geo":0.018277782946825027,"##graphic":0.2939472198486328,"feature":0.17802369594573975,"screens":0.14558027684688568,"barber":0.3900335431098938,"##
gram":0.0714162290096283,"##vate":0.013553030788898468,"##bution":0.014338396489620209,"##yl":0.25308093428611755,"##ifiers":0.05411512032151222,"##cala":0.010039492510259151,"##yr":0.2732725441455841,"##lation":0.2727527320384979,"liquid":0.49843525886535645,"yong":0.0038222954608500004,"small":0.37524423003196716,"##ulio":0.22204338014125824,"date":0.21555747091770172,"data":0.8183135986328125,"dad":0.4705299735069275,"nicholls":0.4501056671142578,"space":0.16691286861896515,"spec":0.040791332721710205,"reference":0.007141203619539738,"1652":0.019288841634988785,"publishers":0.07127825915813446,"robots":0.024891898036003113,"potential":0.23139850795269012,"package":0.31911900639533997,"offset":0.3510378897190094,"resource":0.23248012363910675,"kind":0.16756442189216614,"##pace":0.49072831869125366,"format":0.23737260699272156,"opened":0.16193094849586487,"published":0.28981277346611023,"##pro":0.21785274147987366,"##ide":0.1334296464920044,"publisher":0.24062983691692352,"##zer":0.039862051606178284,"files":0.024187743663787842,"who":0.06305094063282013,"##ato":0.2779949903488159,"challenges":0.3034052550792694,"##duction":0.29332664608955383,"unexpected":0.11760217696428299,"reactor":0.15944677591323853,"##zed":0.13110053539276123,"values":0.10069908946752548,"scientific":0.0941481664776802,"link":0.08465072512626648,"emily":0.11495236307382584,"##ate":0.04325370118021965,"imp":0.18478964269161224,"platform":0.0030408964958041906,"##ata":0.0023984932340681553,"database":0.2722652852535248,"##2":0.10677771270275116,"contributor":0.14785975217819214,"##3":0.060234010219573975,"array":0.42135804891586304,"cat":0.19325263798236847,"##8":0.11743713170289993,"studies":0.0010371580719947815,"david":0.08721303939819336,"value":0.6636805534362793,"sam":0.08709872514009476,"##ass":0.09347686916589737,"chromosome":0.1426510363817215,"##dium":0.032257337123155594,"##brand":0.3050648272037506,"resources":0.040620964020490646,"performance":0.17556723952293396,"variable":0.0160
6391742825508,"challenge":0.1987987607717514,"timothy":0.12652117013931274,"novak":0.008132821880280972,"##chemical":0.1541735827922821,"methodology":0.04617017135024071},"dates":[{"kind":"Publication date","value":"2023-02-09"}],"source":"DSpace@MIT","title":"Open-Source Chromatographic Data Analysis for Reaction Optimization and Screening","related_items":[{"description":"ACS Central Science","relationship":"host"}],"source_link":"https://dspace.mit.edu/handle/1721.1/162482","content_type":["Article"],"rights":[{"description":"Creative Commons Attribution","kind":"useAndReproduction"}],"publishers":[{"name":"American Chemical Society"}],"links":[{"url":"https://hdl.handle.net/1721.1/162482","kind":"Digital object URL","text":"Digital object URL"}],"contributors":[{"value":"Haas, Christian P","kind":"author"},{"value":"Lübbesmeyer, Maximilian","kind":"author"},{"value":"Jin, Edward H","kind":"author"},{"value":"McDonald, Matthew A","kind":"author"},{"value":"Koscher, Brent A","kind":"author"},{"value":"Guimond, Nicolas","kind":"author"},{"value":"Di Rocco, Laura","kind":"author"},{"value":"Kayser, Henning","kind":"author"},{"value":"Leweke, Samuel","kind":"author"},{"value":"Niedenführ, Sebastian","kind":"author"},{"value":"Nicholls, Rachel","kind":"author"},{"value":"Greeves, Emily","kind":"author"},{"value":"Barber, David M","kind":"author"},{"value":"Hillenbrand, Julius","kind":"author"},{"value":"Volpin, Giulio","kind":"author"},{"value":"Jensen, Klavs F","kind":"author"},{"value":"Massachusetts Institute of Technology. Department of Chemical Engineering","kind":"department"}],"timdex_record_id":"dspace:1721.1-162482"},"sort":[9.66168,1675900800000]},{"_index":"dspace-2026-02-09t19-23-02","_id":"dspace:1721.1-155775","_score":9.566903,"_source":{"summary":["Causal analysis is an essential lens for understanding complex system dynamics in domains as varied as medicine, economics and law. 
Computer systems are often similarly complex, but much of the information about them is only available in long, messy, semi-structured log files. This demo presents Sawmill, an open-source system that makes it possible to extract causal conclusions from log files. Sawmill employs methods drawn from the areas of data transformation, cleaning, and extraction in order to transform logs into a representation amenable to causal analysis. It gives log-derived variables human-understandable names and distills the information present in a log file around a user's chosen causal units (e.g. users or machines), generating appropriate aggregated variables for each causal unit. It then leverages original algorithms to efficiently use this representation for the novel process of Exploration-based Causal Discovery - the task of constructing a sufficient causal model of the system from available data. Users can engage with this process via an interactive interface, ultimately making causal inference possible using off-the-shelf tools. SIGMOD'24 participants will be able to use Sawmill to efficiently answer causal questions about logs. We will guide attendees through the process of quantifying the impact of parameter tuning on query latency using real-world PostgreSQL server logs, before letting them test Sawmill on additional logs with known causal effects but varying difficulty. A companion video for this submission is available online."],"timdex_provenance":{"source":"dspace","run_date":"2026-03-01","run_id":"3b5fabfb-9ee6-7cac-94a6-3b70ba14679d_7abd3cf1-9ede-4d69-259a-9fc8edfb66a5","run_record_offset":417},"languages":["en"],"citation":"Markakis, Markos, Chen, An Bo, Youngmann, Brit, Gao, Trinity, Zhang, Ziyu et al. 2024. 
\"Sawmill: From Logs to Causal Diagnosis of Large Systems.\"","file_formats":["application/pdf"],"identifiers":[{"value":"979-8-4007-0422-2","kind":"isbn"},{"value":"https://hdl.handle.net/1721.1/155775","kind":"uri"},{"value":"PUBLISHER_CC","kind":"mitlicense"}],"format":"electronic resource","embedding_full_record":{"objects":0.09511005133390427,"##i":0.11951585859060287,"##are":0.32475051283836365,"##frame":0.04022488370537758,"##l":0.1799229383468628,"##m":0.2769913971424103,"extracted":0.2054516077041626,"analyzing":0.24941237270832062,"##q":0.2752539813518524,"contributions":0.01756170764565468,"##u":0.010006574913859367,"retrieval":0.0990370661020279,"complex":0.3158094584941864,"rana":0.17616486549377441,"record":0.13426344096660614,"##x":0.25639477372169495,"sci":0.13833248615264893,"understanding":0.2414982169866562,"##ances":0.10694095492362976,"diagnostic":0.3792780339717865,"ac":0.3823365569114685,"lenses":0.04824139177799225,"#":0.007743679918348789,"attendees":0.14701120555400848,"ai":0.31962886452674866,"*":0.029212167486548424,"analysis":0.6374306678771973,"am":0.10589560121297836,"mill":0.0669935941696167,"submitted":0.036686014384031296,"##sti":0.17248721420764923,"sawmill":0.6797003149986267,"domain":0.31111660599708557,"science":0.2512257397174835,"institute":0.28624024987220764,"extracts":0.050517503172159195,"object":0.2353523075580597,"@":0.11403582990169525,"statistical":0.20331305265426636,"forest":0.0770525187253952,"cited":0.2583301067352295,"proven":0.3308786153793335,"bo":0.07630588859319687,"cleansing":0.005739674903452396,"coding":0.05457726866006851,"citations":0.3345428705215454,"journal":0.1415475606918335,"systems":0.36695802211761475,"peter":0.09869211912155151,"wikipedia":0.013238338753581047,"huang":0.028941571712493896,"computers":0.20091301202774048,"_":0.1511131376028061,"cc":0.1349363476037979,"d":0.01833825744688511,"possible":0.10480118542909622,"##able":7.742084562778473E-4,"information":0.3828441798686981,"z":0.23482863
60502243,"##ance":0.3558690845966339,"analytic":0.2827405333518982,"dia":0.08663709461688995,"novel":0.14799141883850098,"db":0.1472979336977005,"essential":0.21390187740325928,"publications":0.039555810391902924,"represent":0.013002763502299786,"di":0.036587346345186234,"questions":0.24846360087394714,"##and":0.06475136429071426,"language":0.2547367811203003,"##eve":0.03421667218208313,"ds":0.5653846263885498,"analytics":0.31641653180122375,"chinese":0.091458760201931,"##ab":0.0151399876922369,"post":0.3501240611076355,"tim":0.5438323020935059,"##aj":0.015588507987558842,"##ao":0.022220483049750328,"computational":0.14846882224082947,"test":9.350223117507994E-4,"##anal":0.05695657059550285,"encoding":0.01997522823512554,"users":0.2498849481344223,"article":0.20435792207717896,"et":0.12998686730861664,"shelf":0.04571443423628807,"##bf":0.15524840354919434,"labs":0.05928795412182808,"##tri":0.12931449711322784,"useful":0.09044960886240005,"formats":0.2067406326532364,"analytical":0.2845112681388855,"sources":0.10721775889396667,"companion":0.31763872504234314,"young":0.20163024961948395,"aggregation":0.16589121520519257,"lens":0.38891109824180603,"interface":0.07797753065824509,"title":0.04133192077279091,"representation":0.2869631350040436,"content":0.20982952415943146,"random":0.011379106901586056,"##lab":0.1286359578371048,"sourced":0.12433413416147232,"authorship":0.19200891256332397,"##usa":0.17322373390197754,"digital":0.32669657468795776,"##aki":0.32560569047927856,"##du":0.016986150294542313,"lumber":0.2812316119670868,"citation":0.3945282995700836,"michael":0.14371536672115326,"##de":0.503119945526123,"pdf":0.313201367855072,"berkeley":0.04772103950381279,"china":0.038056328892707825,"management":0.04646965488791466,"regression":0.14299707114696503,"publish":0.12416762113571167,"coffee":0.07767703384160995,"interpret":0.011177843436598778,"analyst":0.33858102560043335,"##ncy":0.21338008344173431,"contributors":0.18139150738716125,"hd":0.09619414806365967,"ar
ticles":0.020727258175611496,"copyright":0.07433050125837326,"##man":0.05410414934158325,"##ble":0.14574626088142395,"simulation":0.009899108670651913,"answers":0.14293332397937775,"##llation":0.08924099057912827,"shah":0.2959390878677368,"zhang":0.39158332347869873,"convert":0.07207269221544266,"construct":0.03126354515552521,"tracking":0.030161578208208084,"number":0.029543893411755562,"##ifier":0.13168606162071228,"thesis":0.02740243263542652,"model":0.3578197956085205,"id":0.36097896099090576,"text":0.011223549954593182,"algorithm":0.264199823141098,"##ods":0.23168152570724487,"large":0.5514488816261292,"testing":0.07516885548830032,"understand":0.25200343132019043,"handle":0.09774933755397797,"intel":0.04071390628814697,"intelligence":0.3519522249698639,"system":0.38166069984436035,"anal":0.23969613015651703,"analyze":0.30991047620773315,"explorer":0.17513765394687653,"diagnosed":0.2357434332370758,"authors":0.20870846509933472,"algorithms":0.2900908589363098,"server":0.2795649468898773,"semantic":0.03291984647512436,"inference":0.3992345333099365,"file":0.45878705382347107,"brit":0.1785632073879242,"##gm":0.344020277261734,"rights":0.07616432011127472,"electronic":0.2436634749174118,"417":0.1058586984872818,"quan":0.12337619066238403,"question":0.05665556713938713,"##analysis":0.06457606703042984,"marko":0.39926108717918396,"framework":0.06179994344711304,"##ent":0.08163797855377197,"discovery":0.39044591784477234,"machine":0.14617349207401276,"cite":0.3389713168144226,"php":0.12438205629587173,"logic":0.02117622084915638,"trinity":0.2905224859714508,"##iy":0.13157731294631958,"##gre":0.39530789852142334,"##ena":0.1446092575788498,"use":0.12789390981197357,"bail":0.2557239234447479,"lab":0.18336567282676697,"chun":0.25242361426353455,"hacking":0.015483792871236801,"ma":0.06990033388137817,"publication":0.3619387447834015,"sufficient":0.05160260573029518,"ibrahim":0.36001744866371155,"links":0.07644150406122208,"international":0.16947877407073975,"logs":0.72755
49173355103,"##ix":0.046848393976688385,"constructing":0.16412833333015442,"author":0.2903103530406952,"diagnosis":0.5472230911254883,"domains":0.2869919240474701,"tool":0.2762419283390045,"license":0.04567508399486542,"unit":0.28691643476486206,"task":0.14614611864089966,"202":0.33141231536865234,"cleanup":0.09686161577701569,"harvard":0.06071961298584938,"leverage":0.010211851447820663,"nexus":0.07092396914958954,"code":0.1663767546415329,"university":0.1755591332912445,"##ducted":0.03060460463166237,"units":0.21957096457481384,"mess":0.08620399981737137,"##eving":0.01576552912592888,"demo":0.3773340582847595,"sql":0.2652525305747986,"transform":0.23411515355110168,"##bek":0.2502918243408203,"transformed":0.03135039284825325,"department":0.09602038562297821,"economist":0.041880637407302856,"intelligent":0.01764330454170704,"cyber":0.006556750740855932,"application":0.16528692841529846,"tuned":0.16378985345363617,"##gno":0.2560446560382843,"##ls":9.569376125000417E-4,"machines":0.03476886823773384,"##set":0.05552598834037781,"hypothesis":0.07689028233289719,"authored":0.19343602657318115,"inform":0.08644253760576248,"dynamics":0.2803358733654022,"contribution":0.12693160772323608,"identification":0.10968203842639923,"java":0.09228399395942688,"api":0.0016418487066403031,"publishing":0.2390449196100235,"models":0.20030346512794495,"based":0.19873781502246857,"using":0.1005774438381195,"tuning":0.25858375430107117,"##od":0.382925420999527,"theorem":0.02403865195810795,"processing":0.015430350787937641,"jiang":0.046089816838502884,"complexity":0.09261192381381989,"conference":0.26145824790000916,"document":0.034500185400247574,"experiments":0.004315557423979044,"##des":0.18952274322509766,"sa":0.2087729275226593,"si":0.4236755967140198,"mit":0.5612584352493286,"structured":0.16593438386917114,"##ded":0.0545000322163105,"email":0.04451208561658859,"participants":0.15815198421478271,"variables":0.3226656913757324,"detection":0.19346259534358978,"discovering":0.043695710
599422455,"languages":0.17410776019096375,"##hema":0.07056684792041779,"dept":0.06881973147392273,"diagram":0.053180526942014694,"##01":0.0328918993473053,"ibm":0.08593420684337616,"open":0.31166335940361023,"##re":0.028308764100074768,"project":0.096180759370327,"run":0.20651006698608398,"source":0.3586304783821106,"research":0.10556594282388687,"participant":0.03646359220147133,"##21":0.011525760404765606,"155":0.38991889357566833,"late":0.22499091923236847,"liu":0.30257856845855713,"dynamic":0.1605532467365265,"wood":0.09828320145606995,"cambridge":0.03449929133057594,"ur":0.29240408539772034,"generate":0.06819329410791397,"oracle":0.05862993746995926,"query":0.3135083019733429,"##22":0.12494085729122162,"technologies":0.009909134358167648,"extract":0.41216498613357544,"##25":0.08574289083480835,"laboratory":0.20341065526008606,"converted":0.021132558584213257,"transformations":0.0039076791144907475,"##ede":0.04436572641134262,"citing":0.1804054230451584,"1707":0.04828681796789169,"parameters":0.19380691647529602,"analysts":0.11425205320119858,"submit":0.03163759782910347,"records":0.07518982887268066,"scientist":0.005422065034508705,"isbn":0.2052183598279953,"mass":0.12585553526878357,"generating":0.1412256360054016,"derivative":0.034353092312812805,"video":0.13089138269424438,"conclusion":0.15700408816337585,"1712":0.026561535894870758,"gao":0.3686464726924896,"linux":0.08394873887300491,"causal":0.6886893510818481,"1718":0.0793316587805748,"1717":0.12253490835428238,"haas":0.02443712390959263,"1716":0.1503589153289795,"derived":0.4361056387424469,"1715":0.025975655764341354,"summary":0.07013797014951706,"technology":0.10906684398651123,"##51":0.005034910514950752,"1722":0.15083201229572296,"xi":0.07078322768211365,"1721":0.5179929733276367,"artificial":0.39025887846946716,"1720":0.04848621040582657,"what":0.045233018696308136,"xu":0.02692304365336895,"mark":0.2966872453689575,"1724":0.08703191578388214,"modeling":0.14928944408893585,"software":0.20771305263042
45,"##wei":0.19744697213172913,"reasoning":0.0030406706500798464,"interactive":0.22098657488822937,"repository":0.06301640719175339,"##out":0.11534854024648666,"massachusetts":0.4846636652946472,"timber":0.2554995119571686,"##nse":0.09507014602422714,"97":0.07005196809768677,"transformers":0.019204948097467422,"method":0.2700064182281494,"##lice":0.16640277206897736,"conclusions":0.25522175431251526,"##tech":0.08471938967704773,"extraction":0.36913856863975525,"##75":0.033762071281671524,"creative":0.009402437135577202,"filing":0.0401427261531353,"logging":0.5575519800186157,"demos":0.311291366815567,"log":0.8597608208656311,"methods":0.2662981450557709,"tools":0.28393352031707764,"commons":0.2621326744556427,"derive":0.10470431298017502,"computer":0.37848201394081116,"semi":0.27612900733947754,"##bution":0.06391923129558563,"##ifiers":0.09712900966405869,"explore":0.06523439288139343,"abstract":0.0011752931168302894,"transformation":0.2681013345718384,"##mann":0.2983715534210205,"##lls":0.04443737119436264,"yong":0.09851213544607162,"submission":0.2222282886505127,"chan":0.05488675460219383,"economic":0.009434144012629986,"##lla":0.15044429898262024,"statistics":0.14591817557811737,"date":0.2395564466714859,"data":0.6234789490699768,"transforms":0.1253463327884674,"##kit":0.07795561105012894,"used":0.021904094144701958,"space":0.16954267024993896,"reference":0.02688394859433174,"publishers":0.10587123036384583,"from":0.12697942554950714,"tag":0.025926725938916206,"discover":0.11677061766386032,"exploration":0.2069137692451477,"offset":0.36872994899749756,"resource":0.29616522789001465,"kind":0.2120722383260727,"cleaner":0.014085683040320873,"##pace":0.528937816619873,"format":0.27948620915412903,"published":0.29756075143814087,"mining":0.007965129800140858,"messy":0.22586220502853394,"##pro":0.24529705941677094,"fraud":0.028113247826695442,"techniques":0.019344689324498177,"files":0.4295888841152191,"publisher":0.26041558384895325,"topic":0.002231106162071228,"larg
est":0.04659494757652283,"##duction":0.36024829745292664,"scientific":0.012176662683486938,"link":0.09439817070960999,"caf":0.49000948667526245,"tune":0.14324969053268433,"##oop":0.00604228675365448,"aggregate":0.3404524624347687,"database":0.26806533336639404,"computing":0.2276461124420166,"contributor":0.13811904191970825,"servers":0.03775390610098839,"##4":0.28979241847991943,"parameter":0.2291731834411621,"##7":0.09083980321884155,"##9":0.05904914811253548,"value":0.5855489373207092,"##ass":0.0911247581243515,"chen":0.4158998727798462,"cleaning":0.245879128575325,"process":0.17895683646202087,"sap":0.07587181776762009,"resources":0.1743272840976715,"clean":0.08936330676078796,"economics":0.19645600020885468,"variable":0.3385172486305237,"investigation":0.015540082938969135,"cheng":0.10278815031051636,"derivation":0.023169487714767456,"user":0.20777735114097595,"timothy":0.182199627161026,"methodology":0.2067672312259674},"dates":[{"kind":"Publication date","value":"2024-06-09"}],"source":"DSpace@MIT","title":"Sawmill: From Logs to Causal Diagnosis of Large Systems","source_link":"https://dspace.mit.edu/handle/1721.1/155775","content_type":["Article"],"rights":[{"description":"Creative Commons Attribution","kind":"useAndReproduction"}],"publishers":[{"name":"ACM|Companion of the 2024 International Conference on Management of Data"}],"links":[{"url":"https://hdl.handle.net/1721.1/155775","kind":"Digital object URL","text":"Digital object URL"}],"contributors":[{"value":"Markakis, Markos","kind":"author"},{"value":"Chen, An Bo","kind":"author"},{"value":"Youngmann, Brit","kind":"author"},{"value":"Gao, Trinity","kind":"author"},{"value":"Zhang, Ziyu","kind":"author"},{"value":"Shahout, Rana","kind":"author"},{"value":"Chen, Peter Baile","kind":"author"},{"value":"Liu, Chunwei","kind":"author"},{"value":"Sabek, Ibrahim","kind":"author"},{"value":"Cafarella, Michael","kind":"author"},{"value":"Massachusetts Institute of Technology. 
Computer Science and Artificial Intelligence Laboratory","kind":"department"}],"timdex_record_id":"dspace:1721.1-155775"},"sort":[9.566903,1717891200000]},{"_index":"dspace-2026-02-09t19-23-02","_id":"dspace:1721.1-155538","_score":9.546787,"_source":{"summary":["To improve the performance of scanning and filtering, modern analytic data systems such as Amazon Redshift and Databricks Delta Lake give users the ability to sort a table using a Z-order, which maps each row to a \"Z-value\" by interleaving the binary representations of the row's attributes, then sorts rows by their Z-values. These Z-order layouts essentially sort the table by multiple columns simultaneously and can achieve superior performance to single-column sort orders when the user's queries filter over multiple columns. However, the user shoulders the burden of manually selecting the columns to include in the Z-order, and a poor choice of columns can significantly degrade performance. Furthermore, these systems treat all columns included in the Z-order as equally important, which often does not result in the best performance due to the unequal impact that different columns have on query performance. In this work, we investigate the performance impact of using Z-orders that place unequal importance on columns: instead of using an equal number of bits from each column in the Z-value interleaving, we allow unequal bit allocation. We introduce a technique that uses Bayesian optimization to automatically learn the best bit allocation for a Z-order layout on a given dataset and query workload. Z-order layouts using our learned bit allocations outperform equal-bit Z-orders by up to 1.6× in query runtime and up to 2× in rows scanned."],"timdex_provenance":{"source":"dspace","run_date":"2026-03-01","run_id":"3b5fabfb-9ee6-7cac-94a6-3b70ba14679d_7abd3cf1-9ede-4d69-259a-9fc8edfb66a5","run_record_offset":190},"languages":["en"],"citation":"Gao, Jenny, Ding, Jialin, Sudhir, Sivaprasad and Madden, Samuel. 2024. 
\"Learning Bit Allocations for Z-Order Layouts in Analytic Data Systems.\"","file_formats":["application/pdf"],"identifiers":[{"value":"979-8-4007-0680-6","kind":"isbn"},{"value":"https://hdl.handle.net/1721.1/155538","kind":"uri"},{"value":"PUBLISHER_CC","kind":"mitlicense"}],"format":"electronic resource","embedding_full_record":{"authored":0.05578102916479111,"##b":0.014444692060351372,"inform":2.1505200129467994E-4,"optimal":0.17316299676895142,"objects":0.0671735480427742,"delta":0.6876546144485474,"##i":0.02227931283414364,"##frame":0.0717260017991066,"##m":0.09588968753814697,"##q":0.25499260425567627,"java":0.15083090960979462,"##s":0.07127928733825684,"ssr":0.02362414263188839,"scanned":0.3068147301673889,"retrieval":0.03403192013502121,"record":0.1960032433271408,"scanner":0.29808351397514343,"##x":0.19906944036483765,"##z":0.1327892392873764,"bay":0.4908413887023926,"sorts":0.4239387810230255,"filtering":0.32482844591140747,"publishing":0.2059982568025589,"databases":0.1728879064321518,"ac":0.2709139585494995,"using":0.18511657416820526,"#":0.03002086468040943,"impact":0.24948494136333466,"ai":0.2780439257621765,"analysis":0.10176615417003632,"warehouse":0.04148557409644127,"-":0.2758358418941498,"each":0.18442919850349426,"bucket":0.03977382928133011,"sorted":0.38360923528671265,"selection":0.08155601471662521,"highest":0.07031437754631042,"##lake":0.21804291009902954,"aw":0.08352666348218918,"reds":0.4630526900291443,"science":0.12725025415420532,"domain":0.02692299708724022,"processing":0.018912484869360924,"institute":0.16611535847187042,"object":0.20230011641979218,"statistical":0.00863201729953289,"sud":0.2585204243659973,"scanning":0.42588716745376587,"ordering":0.4023417532444,"achieve":0.17950108647346497,"automatically":0.23763470351696014,"##type":0.0540403388440609,"bi":0.012044049799442291,"scan":0.3306286931037903,"cited":0.14251983165740967,"##quitable":0.03733164817094803,"proven":0.23267020285129547,"##des":0.11889161169528961,"how":0.067
91271269321442,"citations":0.25011157989501953,"256":0.0818248763680458,"journal":0.05310331657528877,"systems":0.18453262746334076,"##lea":0.23476523160934448,"si":0.23013634979724884,"does":0.09399960190057755,"259":0.002194111468270421,"by":0.06105552613735199,"mit":0.5219647288322449,"##ries":0.1118418350815773,"samuel":0.35218992829322815,"attribute":0.18974186480045319,"[":0.007109035272151232,"equality":0.22630280256271362,"computers":0.0676659643650055,"email":0.005342117045074701,"_":0.07362290471792221,"ordered":0.3384864926338196,"##grade":0.12720295786857605,"languages":0.19539642333984375,"d":0.019955016672611237,"learn":0.3753136992454529,"##hema":0.23897914588451385,"fastest":0.057029418647289276,"column":0.45626747608184814,"##dicate":0.011218545027077198,"dept":0.006437854841351509,"many":0.09639047831296921,"##ocating":0.2931099832057953,"single":0.29685792326927185,"##esian":0.12348886579275131,"##00":0.06503232568502426,"##01":0.041804004460573196,"##pr":0.15534605085849762,"automated":0.11233938485383987,"##spar":0.047363944351673126,"advantages":0.05206727981567383,"##qual":0.42362430691719055,"ibm":0.12473424524068832,"z":0.9871567487716675,"information":0.03485803306102753,"##ance":0.31101933121681213,"analytic":0.4133577346801758,"db":0.24880702793598175,"performs":0.05024944990873337,"language":0.23022715747356415,"run":0.19265735149383545,"source":0.18123847246170044,"##pers":0.04080526903271675,"ds":0.5643783807754517,"##ba":0.0800715759396553,"analytics":0.297265887260437,"red":0.2566937804222107,"155":0.2821919023990631,"apache":0.030644062906503677,"bias":0.009037273935973644,"tim":0.5261267423629761,"##imi":0.21299658715724945,"##rate":0.034109294414520264,"ur":0.29414480924606323,"##erate":0.013851393014192581,"##load":0.1553620845079422,"computational":0.03845427557826042,"disadvantage":0.06357044726610184,"oracle":0.2746211588382721,"maps":0.2341509312391281,"query":0.42538294196128845,"##by":0.01673106476664543,"learns":0.01357459
370046854,"batch":0.012385774403810501,"##ried":0.016905443742871284,"encoding":0.12707525491714478,"##table":0.0993351936340332,"users":0.25404736399650574,"article":0.09711126983165741,"##25":0.05636368691921234,"##bf":0.1660819947719574,"laboratory":0.03237500786781311,"learnt":0.132745161652565,"##ede":0.05963512137532234,"spaces":0.016620932146906853,"citing":0.0408446341753006,"##ves":0.017723247408866882,"que":0.1713765263557434,"allow":0.09928940236568451,"formats":0.2293427288532257,"analytical":0.3497486710548401,"records":0.19360238313674927,"importance":0.20033660531044006,"isbn":0.21413809061050415,"mass":0.017713423818349838,"learning":0.510498046875,"aggregation":0.14342676103115082,"##forms":0.043622005730867386,"training":0.020688826218247414,"##ved":0.09804407507181168,"representation":0.21157827973365784,"content":0.2878567576408386,"##hir":0.23544663190841675,"ding":0.28023606538772583,"##lab":0.008613244630396366,"gao":0.4475809931755066,"load":0.07193736732006073,"authorship":0.10370877385139465,"sorting":0.3242869973182678,"uneven":0.29162105917930603,"lakes":0.22452418506145477,"selecting":0.018437180668115616,"digital":0.2850770056247711,"allocation":0.662749707698822,"learned":0.3645995259284973,"citation":0.312406986951828,"##base":0.08009570837020874,"multiple":0.3822598159313202,"perform":0.29596203565597534,"filters":0.32201069593429565,"##51":0.07544213533401489,"une":0.4399344027042389,"##52":0.051661089062690735,"##53":0.12339938431978226,"layout":0.5517568588256836,"equal":0.5272729992866516,"##time":0.2230142056941986,"better":0.02494647540152073,"##de":0.43980395793914795,"1722":0.09323479980230331,"1721":0.37437674403190613,"artificial":0.3375431299209595,"superior":0.23389850556850433,"##form":0.11233292520046234,"##46":0.05102076753973961,"pdf":0.29558610916137695,"publish":0.10508351773023605,"analyst":0.006745306774973869,"achieved":0.004255767446011305,"relational":0.1257719248533249,"contributors":0.013614584691822529,"hd":
0.018808191642165184,"pub":0.010735852643847466,"jia":0.1699633151292801,"software":0.03815966844558716,"bin":0.0027022953145205975,"bit":0.7877194285392761,"type":0.12776340544223785,"multi":0.16939163208007812,"improved":0.11039026081562042,"number":0.06254927068948746,"tables":0.40934592485427856,"##ifier":0.0891495943069458,"filtered":0.24368402361869812,"optimization":0.3829959034919739,"scans":0.2617490291595459,"enable":0.05877969413995743,"massachusetts":0.43274036049842834,"id":0.27644386887550354,"##va":0.10217668116092682,"zinc":0.2906571924686432,"##nse":0.059307459741830826,"order":0.9206082224845886,"algorithm":0.23199047148227692,"##ve":0.02768038585782051,"mapping":0.30640336871147156,"method":0.008963387459516525,"byte":0.35058197379112244,"##lice":0.10351115465164185,"inter":0.3947453796863556,"bits":0.5582915544509888,"handle":0.1362648755311966,"##cing":0.03220481425523758,"impacts":0.1032881960272789,"ze":0.08207187801599503,"transactions":0.005547333974391222,"##brick":0.4680192470550537,"intelligence":0.330859899520874,"inequality":0.07317159324884415,"system":0.1878315508365631,"##sing":0.06118593364953995,"issn":0.03432163596153259,"binary":0.35691967606544495,"orders":0.6147248148918152,"madden":0.4670356512069702,"##ft":0.16711796820163727,"hash":0.14845386147499084,"authors":0.05349148064851761,"hive":0.10941248387098312,"algorithms":0.20582322776317596,"server":0.04510162025690079,"##per":0.2571779489517212,"columns":0.4761648178100586,"methods":0.030148493126034737,"commons":0.20032580196857452,"enabled":0.007111972663551569,"computer":0.24438607692718506,"##bit":0.45112523436546326,"##oca":0.3174950182437897,"file":0.2519204914569855,"modern":0.06856527179479599,"electronic":0.2123681902885437,"ability":0.17817836999893188,"map":0.28306108713150024,"table":0.5291950702667236,"##formed":0.11044774949550629,"include":0.012675940059125423,"##bution":0.005348882172256708,"##ifiers":0.07033563405275345,"marko":0.08189871162176132,"filter":0
.4231155514717102,"excel":0.08036530762910843,"##hi":0.1801939308643341,"##ent":0.029968516901135445,"grid":0.1031641885638237,"equals":0.22670629620552063,"cite":0.22858817875385284,"php":0.08047708868980408,"attributes":0.16983848810195923,"##ration":0.06306586414575577,"logic":0.02412441000342369,"queue":0.12793013453483582,"##ord":0.3546735644340515,"statistics":0.06198815628886223,"date":0.21785657107830048,"auto":0.030108556151390076,"data":0.6760654449462891,"##gre":0.11916826665401459,"##vos":0.03054223023355007,"equally":0.24402853846549988,"use":0.17297156155109406,"integer":0.16759011149406433,"used":0.0454009473323822,"lab":0.018133189529180527,"space":0.16429032385349274,"faster":0.07724310457706451,"automation":0.08718021959066391,"publication":0.3000849485397339,"poole":0.10123425722122192,"##code":0.008629622869193554,"publishers":0.1323641985654831,"links":0.01752213016152382,"jenny":0.3556477427482605,"different":0.04810444265604019,"evie":0.0642511174082756,"manually":0.10884223133325577,"offset":0.41405484080314636,"resource":0.22709403932094574,"kind":0.3431462347507477,"author":0.13703195750713348,"##pace":0.4820011258125305,"format":0.29303693771362305,"cpu":0.0015116772847250104,"sort":0.696371853351593,"published":0.1815396100282669,"dong":0.012178405188024044,"amazon":0.5578664541244507,"important":0.2831951379776001,"license":0.00780289014801383,"##pro":0.15093915164470673,"202":0.14729352295398712,"δ":1.6868248349055648E-4,"improve":0.2558715343475342,"##zes":0.1513432413339615,"techniques":0.1467120200395584,"publisher":0.2535020112991333,"files":0.07971792668104172,"lake":0.5228524208068848,"code":0.09975213557481766,"##duction":0.317937433719635,"scala":0.04854529723525047,"##ducted":0.01088029146194458,"values":0.37814390659332275,"technique":0.173899844288826,"why":0.0562930554151535,"best":0.39770081639289856,"##oop":0.11726821213960648,"sql":0.41972771286964417,"aggregate":0.13521195948123932,"##lin":0.032649021595716476,"database"
:0.44329482316970825,"##ving":0.3550584316253662,"computing":0.13067889213562012,"array":0.13752031326293945,"##8":0.019894972443580627,"row":0.4275399148464203,"brick":0.006735978648066521,"value":0.5642986297607422,"included":0.07402681559324265,"sam":0.08993932604789734,"allocated":0.36716926097869873,"allows":0.08835143595933914,"sap":0.1717306524515152,"assignment":0.07762989401817322,"advantage":0.04922306537628174,"performing":0.17939020693302155,"automatic":0.11095517128705978,"resources":0.017588043585419655,"rows":0.40649473667144775,"##asa":0.19702963531017303,"lakeside":0.019438952207565308,"performance":0.6050975918769836,"application":0.12656168639659882,"variance":0.04044201597571373,"bytes":0.11088438332080841,"##set":0.20326173305511475,"user":0.24444986879825592,"timothy":0.0995791032910347},"dates":[{"kind":"Publication date","value":"2024-06-09"}],"source":"DSpace@MIT","title":"Learning Bit Allocations for Z-Order Layouts in Analytic Data Systems","source_link":"https://dspace.mit.edu/handle/1721.1/155538","content_type":["Article"],"rights":[{"description":"Creative Commons Attribution","kind":"useAndReproduction"}],"publishers":[{"name":"ACM"}],"links":[{"url":"https://hdl.handle.net/1721.1/155538","kind":"Digital object URL","text":"Digital object URL"}],"contributors":[{"value":"Gao, Jenny","kind":"author"},{"value":"Ding, Jialin","kind":"author"},{"value":"Sudhir, Sivaprasad","kind":"author"},{"value":"Madden, Samuel","kind":"author"},{"value":"Massachusetts Institute of Technology. Computer Science and Artificial Intelligence Laboratory","kind":"department"}],"timdex_record_id":"dspace:1721.1-155538"},"sort":[9.546787,1717891200000]},{"_index":"dspace-2026-02-09t19-23-02","_id":"dspace:1721.1-154387","_score":9.4433565,"_source":{"summary":["Community organizations face challenges in harnessing the power of qualitative data analysis, or sensemaking, to understand the diverse perspectives and needs brought up by their constituents. 
One of the most time-consuming and tedious parts of sensemaking is qualitative coding, or the process of identifying themes across a large and unstructured corpus of community input. A challenge in qualitative coding is attaining high intercoder reliability, especially between expert and beginner sensemakers. In this work, we present SenseMate, a novel human-AI system designed to help with qualitative coding. SenseMate leverages rationale extraction models, a new machine learning strategy to semi-automate sensemaking, which produces theme recommendations and human-interpretable explanations. The models were trained on a dataset of people’s experiences living in Boston, which was annotated for themes by expert sensemakers. We integrated rationale extraction models into SenseMate through an iterative, human-centered design process revolving around four key design principles derived from an extensive literature review. The design process consisted of three iterations with continuous feedback from seven people associated with community organizations. Through an online experiment involving 180 novice sensemakers, we aimed to determine whether AI-generated recommendations and rationales would decrease coding time, increase intercoder reliability (i.e. Cohen’s kappa), and minimize differences between novice and expert coding decisions (i.e. F-score of participant answers compared to expert gold labels). We found that though the model recommendations and explanations increased coding time by 49 seconds per unit of analysis, they raised intercoder reliability by 29% and coding F-score by 10%. Regarding the effectiveness of SenseMate’s design, participants reported that the platform was generally easy to use. 
In summary, Sensemate is (1) built for beginner sensemakers without a technical background, a user group that prior work doesn’t focus on, (2) implements rationale extraction models to recommend themes and generate explanations, which has advantages over large language models in terms of user privacy and control, and (3) contains original and intuitive features created from user feedback that can be applied to future QDA systems."],"timdex_provenance":{"source":"dspace","run_date":"2026-04-15","run_id":"a816f3dc-51ac-7e5f-cec8-1086ffc54274_861de409-c771-2e2c-c416-93c81a0885e3","run_record_offset":1268},"languages":["en"],"citation":"Overney, Cassandra, Saldías, Belén, Dimitrakopoulou, Dimitra and Roy, Deb. 2024. \"SenseMate: An Accessible and Beginner-Friendly Human-AI Platform for Qualitative Data Analysis.\"","file_formats":["application/pdf"],"identifiers":[{"value":"979-8-4007-0508-3","kind":"isbn"},{"value":"https://hdl.handle.net/1721.1/154387","kind":"uri"},{"value":"PUBLISHER_CC","kind":"mitlicense"}],"format":"electronic 
resource","embedding_full_record":{"authored":0.035051047801971436,"inform":0.06282131373882294,"##e":0.08132171630859375,"accessibility":0.028527820482850075,"##naire":0.005242400802671909,"objects":0.04176513850688934,"##i":0.03379335254430771,"expertise":0.29869720339775085,"explanation":0.26510685682296753,"extracted":0.2184520810842514,"##m":0.20111896097660065,"analyzing":0.20308400690555573,"themes":0.4190088212490082,"score":0.3426027297973633,"##q":0.03764427453279495,"##r":0.25920504331588745,"ted":0.2116296887397766,"record":0.08737974613904953,"##x":0.19815993309020996,"##ances":0.05249284207820892,"api":0.07814959436655045,"publishing":0.22862908244132996,"knowledge":0.041195452213287354,"organizational":0.03853921592235565,"app":0.0057275728322565556,"models":0.29642578959465027,"ac":0.2689822018146515,"qu":0.6487764120101929,"ai":0.5749683976173401,"community":0.6332842111587524,"analysis":0.4631650149822235,"labels":0.2387954145669937,"input":0.16986563801765442,"cognitive":0.0638701319694519,"cassandra":0.48310691118240356,"institute":0.283805251121521,"agile":0.12193569540977478,"##ructured":0.030908985063433647,"object":0.1899774968624115,"boston":0.532672643661499,"@":0.04426391050219536,"accessible":0.47574836015701294,"##rak":0.2191564440727234,"statistical":0.20313100516796112,"access":0.23274201154708862,"achieve":0.05453372746706009,"experiments":0.21742016077041626,"cited":0.1530768871307373,"recommend":0.01034724060446024,"proven":0.3094492256641388,"stakeholders":0.014067808166146278,"##des":0.15421603620052338,"lowell":0.023591695353388786,"centred":0.060578010976314545,"gold":0.4576416015625,"coding":0.6138292551040649,"##op":0.11582937836647034,"how":0.017433052882552147,"citations":0.23693221807479858,"journal":0.03258036822080612,"systems":0.13112342357635498,"##ou":0.14403656125068665,"mit":0.6163773536682129,"perspective":0.030390962958335876,"u2":0.15929248929023743,"rational":0.6255239844322205,"email":0.00978733692318201,"partic
ipants":0.24756966531276703,"minimize":0.011021852493286133,"scoring":0.10205505788326263,"languages":0.2596634030342102,"ness":0.09451276808977127,"decision":0.07538028806447983,"learn":0.05019080266356468,"strategies":0.0427527092397213,"f":0.2134874165058136,"##qi":0.016525818035006523,"maker":0.4353676736354828,"##00":0.07733181864023209,"q":0.43233540654182434,"##01":0.3815893232822418,"automated":0.21505804359912872,"advantages":0.12956009805202484,"ibm":0.10085424035787582,"difficulties":0.020362505689263344,"##ance":0.3328593075275421,"experts":0.19899599254131317,"analytic":0.14596043527126312,"novel":0.25678157806396484,"cohen":0.392900288105011,"##re":0.03682249039411545,"##maker":0.4992017149925232,"senses":0.3948008120059967,"centered":0.15573710203170776,"bel":0.31373274326324463,"dim":0.4600251317024231,"corpus":0.26694056391716003,"project":0.052088454365730286,"organisation":0.033401697874069214,"language":0.28878054022789,"run":0.15091240406036377,"source":0.1916714459657669,"recommendations":0.29926830530166626,"challenging":0.23529981076717377,"robotic":0.037060074508190155,"participant":0.27675384283065796,"research":0.2704782485961914,"##erated":0.18130774796009064,"ds":0.4985189139842987,"analytics":0.2797783315181732,"154":0.2526302933692932,"apache":0.013102480210363865,"##16":0.0582435168325901,"generated":0.002932940609753132,"bias":0.03625337406992912,"tim":0.5087875127792358,"cambridge":0.08441949635744095,"##erate":0.23876076936721802,"ur":0.18739086389541626,"generate":0.11770779639482498,"benji":0.23126667737960815,"programming":0.06988358497619629,"##ra":0.18453124165534973,"computational":0.06027847155928612,"making":0.2665744125843048,"cassie":0.1479817032814026,"encoding":0.18924127519130707,"##anal":0.008626587688922882,"users":0.2094803750514984,"article":0.09237034618854523,"decrease":0.03825388103723526,"technologies":0.016122395172715187,"##rs":0.05912037566304207,"extract":0.3782912492752075,"labs":0.09293016046285629,"labor
atory":0.14424127340316772,"##tri":0.04157785326242447,"##mate":0.6582593321800232,"##ney":0.4323630928993225,"##eda":0.15500770509243011,"implements":0.01640520989894867,"analysts":0.1332501769065857,"identifying":0.11849416047334671,"formats":0.13793087005615234,"analytical":0.16800591349601746,"trained":0.12276292592287064,"technical":0.02165394462645054,"##ner":0.2872452437877655,"isbn":0.14096680283546448,"mass":0.0724702700972557,"##das":0.0509328618645668,"privacy":0.130516916513443,"learning":0.3040916323661804,"generating":0.1052420437335968,"training":0.03191087767481804,"##da":0.3815576434135437,"content":0.2320048213005066,"##mates":0.3913726508617401,"##lab":0.1870255470275879,"##38":0.3308315575122833,"constituent":0.0710059106349945,"authorship":0.13747037947177887,"##works":0.13579291105270386,"##erative":0.35729625821113586,"human":0.615001916885376,"effectiveness":0.30049118399620056,"digital":0.23933692276477814,"over":0.13287189602851868,"sensing":0.16831223666667938,"identify":0.11695647984743118,"citation":0.30686378479003906,"org":0.13627828657627106,"label":0.18924663960933685,"technology":0.011215594597160816,"##de":0.48303723335266113,"1721":0.37728413939476013,"artificial":0.28751522302627563,"##tative":0.3082575798034668,"pdf":0.21772795915603638,"what":0.02482382394373417,"regression":0.038391001522541046,"interpret":0.17905323207378387,"publish":0.13351409137248993,"analyst":0.22922657430171967,"time":0.14322371780872345,"contributors":0.10566365718841553,"humans":0.27522870898246765,"##mat":0.4652155935764313,"expert":0.49974989891052246,"copyright":0.051196254789829254,"modeling":0.13935725390911102,"software":0.3605682849884033,"##ova":0.06541246920824051,"reasoning":0.033351294696331024,"answers":0.15515689551830292,"recommendation":0.16008546948432922,"experimental":0.11188173294067383,"program":0.06624230742454529,"##lou":0.16504016518592834,"repository":0.10962186008691788,"tracking":0.08352763950824738,"feedback":0.3214929103851
3184,"reliable":0.3667137324810028,"seconds":0.17527374625205994,"##ifier":0.08526135236024857,"experiment":0.18945787847042084,"massachusetts":0.47145307064056396,"##metric":0.04275393486022949,"model":0.42059797048568726,"id":0.24419085681438446,"attain":0.06016109138727188,"##nse":0.056586481630802155,"dashboard":0.004016093444079161,"algorithm":0.16322889924049377,"reduce":0.1888086348772049,"method":0.08581071346998215,"bernstein":0.06699823588132858,"makers":0.3030698299407959,"##lice":0.07329797744750977,"inter":0.31470656394958496,"sense":0.9036610722541809,"handle":0.11826173216104507,"extraction":0.4859105348587036,"creative":0.04388612136244774,"intelligence":0.2981560230255127,"system":0.2808053195476532,"anal":0.16004976630210876,"mate":0.2992863953113556,"analyze":0.1790120005607605,"begin":0.3502543270587921,"authors":0.10251028090715408,"algorithms":0.19313032925128937,"##ners":0.17415238916873932,"##opus":0.026644907891750336,"methods":0.06514622271060944,"##making":0.5086442232131958,"reliability":0.4897269606590271,"1086":0.02147059515118599,"##rik":0.005265388637781143,"tools":0.1379694789648056,"commons":0.28006333112716675,"file":0.09767690300941467,"labeling":0.10502620041370392,"rights":0.0809420645236969,"electronic":0.08855943381786346,"kappa":0.3609430491924286,"theme":0.2821459174156189,"decisions":0.050843264907598495,"semi":0.20579898357391357,"mat":0.03935711830854416,"##bution":0.04513884335756302,"##ifiers":0.053571682423353195,"topics":0.05196664482355118,"##analysis":0.004478557500988245,"##mine":0.01532280258834362,"framework":0.14251819252967834,"machine":0.3345792889595032,"organization":0.23345711827278137,"attaining":0.021440278738737106,"cite":0.22154971957206726,"##matic":0.21605119109153748,"logic":0.002418737392872572,"##ious":0.2040206640958786,"communities":0.15400616824626923,"statistics":0.07871727645397186,"date":0.007453802041709423,"codes":0.3610258996486664,"auto":0.20051531493663788,"data":0.65194171667099,"friend
ly":0.2469787895679474,"use":0.03075730986893177,"##kit":0.18667320907115936,"lab":0.15061163902282715,"experience":0.04960618540644646,"space":0.16616274416446686,"platforms":0.4684470295906067,"cloud":0.002752522239461541,"automation":0.23452305793762207,"publication":0.2969970703125,"##code":0.4320138990879059,"implemented":0.05204259976744652,"publishers":0.1386297196149826,"links":0.03974438086152077,"##it":0.2528035640716553,"novice":0.2863676846027374,"offset":0.323904812335968,"resource":0.21134056150913239,"kind":0.374551385641098,"author":0.13521341979503632,"##pace":0.5117388963699341,"format":0.15335878729820251,"published":0.19998370110988617,"lever":0.09117842465639114,"sort":0.03532331809401512,"tool":0.168864443898201,"coded":0.19451193511486053,"##pro":0.19863785803318024,"202":0.04411529377102852,"improve":0.15976838767528534,"principles":0.12092729657888412,"publisher":0.26699748635292053,"harvard":0.08264971524477005,"leverage":0.1748998761177063,"code":0.5485436320304871,"##makers":0.5238969326019287,"challenges":0.43933919072151184,"##duction":0.28251126408576965,"scores":0.2197219282388687,"university":0.10327746719121933,"media":0.2542506158351898,"platform":0.6204308271408081,"##oop":0.00379504868760705,"integrated":0.15468668937683105,"##0":0.051281049847602844,"effective":0.2509269416332245,"database":0.11966229975223541,"computing":0.10283888131380081,"contributor":0.0066841677762568,"design":0.2160433679819107,"##mation":0.2527078688144684,"##9":0.2727002799510956,"explanations":0.18102280795574188,"iteration":0.11443653702735901,"value":0.49062657356262207,"roy":0.37618160247802734,"designed":0.06108715757727623,"tufts":0.045916639268398285,"sal":0.33477404713630676,"##ass":0.06895346939563751,"ann":0.0852084830403328,"process":0.1884927749633789,"advantage":0.11806756258010864,"implementation":0.04129289090633392,"resources":0.09135549515485764,"automatic":0.045687828212976456,"intuitive":0.2530251443386078,"##iously":0.103888370096683
5,"application":0.12180248647928238,"sensory":0.22024789452552795,"perspectives":0.1245889961719513,"quantitative":0.14497458934783936,"scored":0.037400029599666595,"harness":0.2570073902606964,"organizations":0.07453785091638565,"challenge":0.43475213646888733,"online":0.006716557778418064,"##set":0.17296698689460754,"strategy":0.16645577549934387,"user":0.2643160820007324,"constituents":0.09501903504133224,"timothy":0.011857268400490284,"methodology":0.13665473461151123},"dates":[{"kind":"Publication date","value":"2024-03-18"}],"source":"DSpace@MIT","title":"SenseMate: An Accessible and Beginner-Friendly Human-AI Platform for Qualitative Data Analysis","source_link":"https://dspace.mit.edu/handle/1721.1/154387","content_type":["Article"],"rights":[{"description":"Creative Commons Attribution","kind":"useAndReproduction"}],"publishers":[{"name":"ACM"}],"links":[{"url":"https://hdl.handle.net/1721.1/154387","kind":"Digital object URL","text":"Digital object URL"}],"contributors":[{"value":"Overney, Cassandra","kind":"author"},{"value":"Saldías, Belén","kind":"author"},{"value":"Dimitrakopoulou, Dimitra","kind":"author"},{"value":"Roy, Deb","kind":"author"},{"value":"Massachusetts Institute of Technology. Media Laboratory","kind":"department"}],"timdex_record_id":"dspace:1721.1-154387"},"sort":[9.4433565,1710720000000]},{"_index":"mitlibwebsite-2026-02-12t15-43-22","_id":"mitlibwebsite:b1bef9479956f640630924cb5a1e5760","_score":9.424737,"_source":{"source":"MIT Libraries Website","source_link":"https://libraries.mit.edu/data-services/gis-data-lab/","timdex_record_id":"mitlibwebsite:b1bef9479956f640630924cb5a1e5760","title":"GIS & Data Lab | MIT Libraries","citation":"MIT Libraries. GIS & Data Lab | MIT Libraries. Website. 
https://libraries.mit.edu/data-services/gis-data-lab/","content_type":["Website"],"contributors":[{"value":"MIT Libraries","kind":"creator","mit_affiliated":true}],"dates":[{"kind":"Accessed","value":"2026-04-04T23:03:32.754845+00:00"}],"format":"electronic resource","fulltext":"GIS & Data Lab The GIS & Data Lab, housed on the 1st floor of Rotch Library (7-238) , is available for use during Rotch’s operating hours . Computers and in-person help is available for the MIT Community only. See Data Services for more info on how to get help. Using the lab Valid MIT ID required for access. The lab can be used for group study, but there are no private study rooms. The lab may occasionally be reserved in part or full for workshops. Information on closures for workshops will be posted on our GIS guide . Computers The GIS & Data Lab is open to all MIT community members. A reservation is required if you will be using a computer remotely. Computers Computers: 16 are available in the Lab and 1 in the front alcove. In-person access is available during Rotch’s operating hours , MIT ID required. MIT Athena (kerberos) is required for login on all computers. High performance computers: Computers #1-8: Alienware Area-51 AAT2250 Processor: Intel(R) Core( TM ) Ultra 9 285K processor (24-Core, 76MB Total Cache, 3.7GHz to 5.7GHz) GPU: RTX5090; 32GB GDDR7 RAM: 64GB Dual Channel DDR5 XMP , 2x 32GB, 6400 MT/s Drives: 1TB NVMe M.2 PCIe Gen4 SSD (Boot) + 2TB NVMe M.2 PCIe Gen4 SSD (Storage) Computers #9-16: Alienware Aurora R15 Processor: 13th gen Intel Core i9-13900F: 24 cores (8 performance, 16 efficient); 32 threads; 2.00-5.60 GHz GPU: RTX4090; Ada Lovelace architecture with 16384 CUDA cores and 8.9 compute capability; 24GB GDDR6 RAM: 64GB, 2x32GB, DDR5, 4800MHz Drives: 1TB NVMe M.2 PCle SSD (Boot); 2TB 7200RPM SATA 6 Gb/s (Storage) Monitors Free-standing monitors with a variety of connectors that you can use with your own laptop, tablet, etc. 
27″ monitors: 4 available — 2 at tables and 2 at desks in open cubes 48″ monitors: 4 available — 1 at each of the computer clusters 75″ monitor: 1 available in the front alcove Data storage Upon logging off, all files will be cleared. For temporary data storage, utilize the shared drives, accessible via the File Explorer path: This PC > UserData(D:) > UserData > and create a folder using your kerberos name (this allows staff to contact you). Mislabeled folders will be deleted. The GIS & Data lab is not an archive and data could be deleted at any time; be sure to properly manage and back up your data. For help with data management or storage, contact Data Management Services . Power settings Computers should never be shut down to allow for shared drive access at all times (locking of machines is allowed during remote access only). Remote access GIS & Data Lab computers can be used remotely during the following times: Weekends (6pm Friday – 10am Monday) When Rotch Library is closed for an extended period of time (holidays, Institute breaks, etc.) While running an analysis, process, etc. that takes longer than 1 day If a personal circumstance prevents you from coming to the lab in person (sickness, extended remote working arrangement, etc.) To use a computer remotely, you MUST email gishelp@mit.edu to schedule a reservation BEFORE beginning your work. Use policies Use of installed software on the computers takes priority over other uses of the machines. See full list of software below. A reservation is required if you will not be using a computer in-person. Reservations cannot be made for more than 1 week, but can be renewed if a computer is available. If you do not renew a reservation the computer will be re-started so that others may use it. GIS staff are not responsible for monitoring the computer. We will place a sign on computers that are being used remotely. 
But, the GIS & Data lab is open to all MIT community members and computers could accidentally get re-started or unplugged. Software The following software is installed on all computers unless otherwise indicated. Use of licensed software is restricted to members of the MIT community for the purposes of research, education, and scholarship. Additional software may be requested pending relevance, cost, and licensing terms by emailing gishelp@mit.edu . GIS & mapping software ArcGIS Pro ESRI Business Analyst with 2025 data* ArcGIS StreetMap Premium North America 2025* CityEngine Google Earth GeoDa QGIS *Your ArcGIS account may not automatically have these licenses activated. Contact GIS Services and we’ll add them to your account. Imagery & visualization software Adobe Acrobat, Illustrator & Photoshop (sign in with your MIT Adobe ID ) AutoCAD Civil 3D Drone2Map ( Contact GIS Services for an Advanced license . Standard licenses are included with every ArcGIS account.*) Fusion 360 Rhino 8 SolidWorks *Your ArcGIS account may not automatically have these licenses activated. Contact GIS Services and we’ll add them to your account. Data analysis software Anaconda python (to open Jupyter Lab, run ‘python -m jupyterlab’ from an Anaconda prompt) Mathematica MATLAB NVIDIA CUDA Toolkit (computers #9 – 16) R & RStudio QualCoder Terms of use Use of licensed software is restricted to members of the MIT community for the purposes of research, education, and scholarship. Under MIT’s licenses, users generally may not: redistribute the software or materials or permit use to anyone other than a member of the MIT community. remove, obscure, or modify any copyright or other notices included in the software or materials. use the software or materials for commercial purposes. 
Leaving MIT: When a member of the organization terminates affiliation with the organization or a member’s affiliation with the organization is terminated by the organization or a person not affiliated with the organization leaves campus, the member or person must destroy all personal copies of the software or derived data. Users are individually responsible for compliance with these terms.","links":[{"url":"https://libraries.mit.edu/data-services/gis-data-lab/","kind":"Website"}],"summary":["The GIS & Data Lab, housed on the 1st floor of Rotch Library (7-238), is available for use during Rotch’s operating hours. Computers and in-person help is available for the MIT Community only. See Data Services for more info on how to get help.   Using the lab Valid MIT ID required for access. The lab can be used for group study, but there are no private study rooms. The lab may occasionally be reserved in part or full for workshops. Information on closures for workshops will be posted on our GIS guide. 
Computers The GIS & Data Lab is […]"],"timdex_provenance":{"source":"mitlibwebsite","run_date":"2026-04-04","run_id":"6af9300c-524a-346b-f7c6-95e232e9f577_1e3e4c5d-27a2-a415-76eb-850434dee63e","run_record_offset":23},"embedding_full_record":{"temporary":0.3654845654964447,"13th":0.1351357102394104,"##b":0.06453821063041687,"##d":0.07596438378095627,"chips":0.05331551283597946,"unavailable":0.11252521723508835,"##mit":0.18355657160282135,"allowed":0.1202281266450882,"del":0.07541073858737946,"##frame":0.11408128589391708,"remote":0.5634795427322388,"laptop":0.4362953305244446,"b1":0.10816781222820282,"setting":0.032384831458330154,"##p":0.09528923034667969,"##cula":0.009728140197694302,"##s":0.5322184562683105,"##u":0.18634942173957825,"##v":0.025233307853341103,"##x":0.1623091697692871,"visual":0.189195916056633,"cube":0.37343570590019226,"ram":0.3477017879486084,"rams":0.09549999982118607,"aa":0.0777849480509758,"databases":0.06855670362710953,"ac":0.056383874267339706,"solid":0.40522417426109314,"agreement":0.026734834536910057,"&":0.08959833532571793,"google":0.3441809415817261,"require":0.17154176533222198,"personal":0.04299383610486984,"reserves":0.02714671939611435,"community":0.3408643901348114,"analysis":0.19202661514282227,"version":0.11045179516077042,"##tica":0.1575927734375,"folder":0.2647475302219391,"reserved":0.32578080892562866,"domain":0.07960053533315659,"institute":0.19577035307884216,"unused":0.04045620560646057,"drive":0.3936574459075928,"accessible":0.27701643109321594,"cited":0.011282828636467457,"proven":0.08983337134122849,"arcs":0.2142050564289093,"posted":0.06794922798871994,"##text":0.03294653445482254,"how":0.15534046292304993,"capability":0.034109797328710556,"##lock":0.02857831120491028,"citations":0.0972217470407486,"dual":0.08591464906930923,"civil":0.22927667200565338,"close":0.2885960638523102,"computers":0.5369840860366821,"policy":0.22356820106506348,"website":0.3260914981365204,"licensed":0.37861353158950806,"address":0.18182249
36723709,"g":0.12096512317657471,"adobe":0.3497765064239502,"i":0.07103727757930756,"photo":0.013630389235913754,"staff":0.25648003816604614,"n":0.16366815567016602,"q":0.19165246188640594,"licenses":0.4894740581512451,"r":0.11602704972028732,"cu":0.07596282660961151,"deleted":0.21516557037830353,"x":0.005551150534301996,"days":0.02787991240620613,"##ance":0.2243361920118332,"under":0.044970057904720306,"dd":0.12081380933523178,"standard":0.10439934581518173,"rooms":0.1423303484916687,"sites":0.07763033360242844,"graphics":0.09533413499593735,"do":0.0034476411528885365,"down":0.16103309392929077,"analytics":0.0498509518802166,"red":0.019144656136631966,"##af":0.04817960411310196,"leave":0.1952195018529892,"contact":0.36216437816619873,"scholarship":0.0589507520198822,"copying":0.055666666477918625,"tim":0.3696863055229187,"programming":0.08392518013715744,"vault":9.467274066992104E-4,"ada":0.46189504861831665,"info":0.07839524745941162,"ed":0.0645895004272461,"computational":0.014624999836087227,"add":0.1540677845478058,"area":0.06406340003013611,"##bu":0.05501757934689522,"need":0.027674410492181778,"scholar":0.031369056552648544,"es":0.442398339509964,"##ca":0.36007416248321533,"users":0.2762467563152313,"##cb":0.04804123938083649,"fusion":0.3381391167640686,"take":0.16834834218025208,"ethernet":0.02141638658940792,"labs":0.4807415008544922,"720":0.06268131732940674,"materials":0.06259564310312271,"##mber":0.014917701482772827,"activation":0.2660302519798279,"private":0.2935381531715393,"##ete":0.10766323655843735,"back":0.022938067093491554,"##da":0.34735772013664246,"directory":0.03763410076498985,"remove":0.13911983370780945,"content":0.07477352023124695,"commercially":0.04639481008052826,"##lab":0.3088116943836212,"desktop":0.13125048577785492,"##ch":0.4592400789260864,"##down":0.18861930072307587,"responsible":0.1466752141714096,"gb":0.1806521862745285,"##con":0.27995869517326355,"##co":0.09446986019611359,"##com":0.02780052274465561,"gi":0.7250070571899414,"
citation":0.17668429017066956,"gp":0.25085705518722534,"monitor":0.23653993010520935,"permission":0.1416502743959427,"room":0.20632793009281158,"##dd":0.11201867461204529,"##de":0.2850935459136963,"schedule":0.17454488575458527,"berkeley":0.10503718256950378,"management":0.06000640243291855,"service":0.20888416469097137,"permit":0.13569539785385132,"analyst":0.1930740475654602,"renew":0.2190217673778534,"prompt":0.1853492558002472,"illustrator":0.2253527045249939,"college":0.08678863197565079,"copyright":0.3963976204395294,"backup":0.1925429254770279,"advanced":0.13221463561058044,"catalog":0.042652443051338196,"channel":0.07186266779899597,"accessed":0.1864752322435379,"ultra":0.10645633190870285,"number":0.24328960478305817,"tables":0.1634664386510849,"cores":0.26666778326034546,"imagery":0.25751587748527527,"##el":0.1734926551580429,"reservation":0.47475606203079224,"lock":0.2576926648616791,"id":0.5274039506912231,"join":8.808507118374109E-4,"spatial":0.22898322343826294,"mapping":0.33183833956718445,"python":0.32537445425987244,"aliens":0.13640156388282776,"##gb":0.16635553538799286,"intel":0.36862146854400635,"##lace":0.35673925280570984,"script":0.03987943381071091,"bosch":0.015234105288982391,"##fi":0.07359400391578674,"drives":0.382623553276062,"install":0.20629674196243286,"explorer":0.1953928917646408,"restriction":0.01216187048703432,"opens":0.04385947063565254,"remotely":0.5682311058044434,"server":0.2193082571029663,"drones":0.3498744070529938,"weekend":0.1833491027355194,"ju":0.328701376914978,"subscription":0.0543639101088047,"restrict":0.18907462060451508,"shutting":0.19830836355686188,"holiday":0.0877598226070404,"valid":0.3078593313694,"aix":0.004046247340738773,"library":0.6549643278121948,"file":0.24682952463626862,"member":0.2861456573009491,"electronic":0.07928576320409775,"ke":0.3500337302684784,"share":0.13075517117977142,"map":0.2826477885246277,"mat":0.20610454678535461,"break":0.17261867225170135,"clustered":0.007491969503462315,"##ie":0.
04904327914118767,"off":0.19780050218105316,"machine":0.2123963087797165,"stored":0.39374879002571106,"cite":0.16153493523597717,"php":0.06117028370499611,"websites":0.2186228334903717,"gigs":0.13485164940357208,"communities":0.009054990485310555,"##eng":0.060086604207754135,"auto":0.24529430270195007,"mail":0.07105503976345062,"usb":0.19399461150169373,"use":0.45014840364456177,"sign":0.1222531795501709,"lab":0.6339790225028992,"photos":0.08690791577100754,"hacking":0.016866903752088547,"geographic":0.13661153614521027,"copies":0.019080523401498795,"mb":0.027304666116833687,"find":0.0886635109782219,"members":0.1611751765012741,"links":0.11840948462486267,"locked":0.3868386447429657,"closure":0.18299508094787598,"logs":0.1610739529132843,"##ix":0.007060069125145674,"settings":0.13670264184474945,"solids":0.11526772379875183,"utc":0.02553999051451683,"##ema":0.09853211045265198,"mt":0.06583943217992783,"cpu":0.31428468227386475,"restrictions":0.23364444077014923,"unmanned":0.002058938378468156,"tool":0.02878691256046295,"##chs":0.13538441061973572,"license":0.5540284514427185,"disk":0.22860778868198395,"panorama":0.04068895801901817,"202":0.08726964145898819,"activate":0.33132651448249817,"plug":0.004968840628862381,"unix":0.07357042282819748,"code":0.18526238203048706,"university":0.3538821339607239,"policies":0.24300870299339294,"storage":0.5019331574440002,"installing":0.062271662056446075,"running":0.022229012101888657,"##dio":0.09198670834302902,"##ist":0.026877818629145622,"ana":0.4012949764728546,"rot":0.617151141166687,"workshops":0.32430505752563477,"reserve":0.17794258892536163,"friday":0.040677785873413086,"working":0.033789392560720444,"floor":0.17105938494205475,"##ma":0.110246941447258,"##mb":0.032173916697502136,"##ches":0.008309381082654,"##me":0.20952939987182617,"requirement":0.028161806985735893,"thread":0.018322911113500595,"##tium":0.10174767673015594,"pc":0.32414084672927856,"reservations":0.3795376121997833,"application":0.0011401129886507988,
"earth":0.2939286231994629,"ames":9.956273715943098E-4,"online":0.16793286800384521,"compliant":0.07040058076381683,"machines":0.2793514132499695,"activated":0.35082507133483887,"cluster":0.15073366463184357,"01":0.00901223998516798,"weekends":0.3302243649959564,"04":0.1327214241027832,"password":0.38595664501190186,"##mp":8.281758637167513E-4,"geography":0.08821521699428558,"238":0.19677874445915222,"##hop":0.09081418812274933,"cache":0.30556103587150574,"using":0.1813245415687561,"13":0.10241885483264923,"qu":0.15894094109535217,"16":0.03821611776947975,"##core":0.011462301015853882,"portable":0.00495459558442235,"monitoring":0.08766903728246689,"processor":0.3290497958660126,"360":0.04674113541841507,"requested":0.10424145311117172,"rd":0.0057022348046302795,"athena":0.43589696288108826,"programs":0.10907363146543503,"##ter":0.3124011754989624,"monitors":0.23324809968471527,"shared":0.3810494840145111,"rs":0.2778327763080597,"24":0.1737397462129593,"archives":0.15539109706878662,"rt":0.08931378275156021,"saturday":0.0012668212875723839,"access":0.5902746319770813,"automatically":0.04250474274158478,"##bat":0.08370920270681381,"##pl":0.07598043978214264,"long":0.1808221936225891,"extended":0.10552316904067993,"##vid":0.21250997483730316,"archived":0.11047869175672531,"arc":0.5634716153144836,"256":0.056447532027959824,"##os":0.24956370890140533,"permitted":0.12971748411655426,"mis":0.0968160554766655,"does":0.03923012688755989,"139":0.13979165256023407,"##sable":0.0914882943034172,"mit":0.8909351229667664,"where":0.15809383988380432,"##dee":0.004820171743631363,"operating":0.3295574188232422,"free":0.016702905297279358,"u2":0.21833884716033936,"email":0.36341872811317444,"32":0.18588732182979584,"ss":0.3041251003742218,"renewal":0.010871877893805504,"librarian":0.296083927154541,"services":0.2798433005809784,"many":0.11697066575288773,"tb":0.10708063095808029,"closes":0.04442311078310013,"stay":0.00805675145238638,"##00":0.19150492548942566,"##01":0.35389855504035
95,"standing":0.13330736756324768,"ibm":0.07410449534654617,"closed":0.404484361410141,"##py":0.2299615889787674,"operation":0.04909311980009079,"open":0.34527286887168884,"contacts":0.1374504119157791,"commercial":0.10512807965278625,"##ri":0.180572047829628,"##boot":0.0947318822145462,"available":0.380865216255188,"project":0.0191352516412735,"run":0.22662955522537231,"source":0.004030237440019846,"secure":0.030902672559022903,"locks":0.2703421413898468,"research":0.2830505967140198,"##gis":0.4335803985595703,"housed":0.14493417739868164,"3d":0.2445223182439804,"##13":0.06445775181055069,"##14":0.03498341143131256,"holidays":0.19373223185539246,"##15":0.12029697746038437,"affiliation":0.20044738054275513,"##16":0.024492353200912476,"un":0.07253112643957138,"cambridge":0.06084177643060684,"51":0.2186763435602188,"ur":0.13101091980934143,"termination":0.019076796248555183,"oracle":0.0018728412687778473,"maps":0.2692752778530121,"##sh":0.1528163105249405,"saturdays":0.09807723015546799,"campus":0.2640620768070221,"telephone":0.03835966810584068,"collection":0.013530291616916656,"pro":0.200703427195549,"sharing":0.19393044710159302,"drone":0.38115018606185913,"##32":0.12530095875263214,"##22":0.23776088654994965,"286":0.03215445950627327,"##24":0.001433000317774713,"##25":0.011041944846510887,"##26":0.10518333315849304,"institutional":0.014800925739109516,"laboratory":0.4656549096107483,"desk":0.044805169105529785,"64":0.26839524507522583,"internet":0.0459894984960556,"installed":0.26198631525039673,"analysts":0.11624674499034882,"memory":0.29822900891304016,"##th":0.08775335550308228,"needed":0.1333228349685669,"scheduled":0.11658619344234467,"pending":0.08528593927621841,"##das":0.08150888234376907,"##40":0.0671197697520256,"##33":0.08463852107524872,"emails":0.05555330216884613,"##34":1.5644889208488166E-4,"##works":0.262484610080719,"street":0.18888914585113525,"linux":0.2333521842956543,"boot":0.09422937780618668,"derived":0.16186662018299103,"##ta":0.01498936675
4889488,"clusters":0.14321362972259521,"##mount":0.015017562545835972,"##rber":0.4209349453449249,"hours":0.4616566300392151,"##ug":0.16997483372688293,"breaks":0.1099405363202095,"locking":0.31703412532806396,"libraries":0.4931124746799469,"##50":0.010738236829638481,"##51":0.2289380431175232,"windows":0.10829204320907593,"storing":0.06634287536144257,"renewed":0.21126778423786163,"##tu":0.11269871890544891,"restricted":0.40404072403907776,"time":0.2756403982639313,"studio":0.026925787329673767,"##ware":0.2630075216293335,"software":0.608104944229126,"program":0.25162994861602783,"processors":0.22479519248008728,"during":0.180401012301445,"repository":0.146992489695549,"required":0.3481570780277252,"compatible":0.008965466171503067,"closing":0.07557568699121475,"terms":0.1754179149866104,"logged":0.037524279206991196,"collections":0.0010930560529232025,"##ged":0.17942176759243011,"guide":0.13857418298721313,"hardware":0.18368206918239594,"##lice":0.022864460945129395,"destroy":0.1841643750667572,"priority":0.07026099413633347,"phone":0.09985125809907913,"anyone":0.11256144195795059,"##rooms":0.0022731211502104998,"logging":0.2650340795516968,"reset":0.019842803478240967,"math":0.22860398888587952,"terminate":0.19953285157680511,"love":0.1450510323047638,"study":0.1415543556213379,"log":0.3585273027420044,"requests":0.06925483793020248,"aurora":0.39038917422294617,"tools":0.13957853615283966,"alien":0.5399145483970642,"commons":0.11876215040683746,"geo":0.4626583755016327,"gen":0.16917502880096436,"computer":0.5997594594955444,"premium":0.1743771880865097,"web":0.16272540390491486,"get":0.06603939831256866,"installation":0.02712150663137436,"copy":0.19943277537822723,"power":0.15009258687496185,"1638":0.201364204287529,"licensing":0.34398746490478516,"architecture":0.21563465893268585,"##90":0.08073090761899948,"display":0.0611240454018116,"help":0.09945982694625854,"site":0.16021035611629486,"nasa":0.014413142576813698,"organization":0.062033314257860184,"cannot":0
.15980933606624603,"located":0.10364848375320435,"accounts":0.2059708833694458,"facility":0.07299534231424332,"date":0.13143588602542877,"shut":0.3395988345146179,"rhino":0.48679137229919434,"data":0.8810224533081055,"##kit":0.24066898226737976,"used":0.19967639446258545,"hosted":0.021497905254364014,"space":0.020921995863318443,"reference":0.03109738603234291,"##pire":0.07322899252176285,"##code":0.23383019864559174,"should":0.020055226981639862,"group":0.1389523297548294,"notebook":0.08337009698152542,"licence":0.39286813139915466,"offset":0.242637038230896,"resource":0.24745017290115356,"workshop":0.23023590445518494,"temporarily":0.1704375147819519,"format":0.1808134764432907,"archive":0.2943863868713379,"core":0.25308477878570557,"edo":0.001116161234676838,"person":0.01715748757123947,"ghz":0.24182714521884918,"files":0.31144821643829346,"send":0.03794536739587784,"request":0.21354015171527863,"disks":0.19553549587726593,"cad":0.21008867025375366,"link":0.16371695697307587,"affiliated":0.14042693376541138,"membership":0.234084352850914,"terminates":0.09581903368234634,"network":0.00763523206114769,"##0":0.1739148050546646,"can":0.2921415865421295,"database":0.3057864010334015,"computing":0.1369612216949463,"##2":0.0652971863746643,"servers":0.09310118108987808,"operations":0.031169015914201736,"##4":0.03182768076658249,"##9":0.16393490135669708,"##lib":0.2672044634819031,"privately":0.07032510638237,"terminated":0.2283426821231842,"requirements":0.20102600753307343,"cost":0.014856872148811817,"limited":0.15507537126541138,"sat":0.1666470319032669,"resources":0.19063912332057953,"threads":0.10688343644142151,"performance":0.10355531424283981,"compliance":0.14599746465682983,"user":0.2996928095817566,"account":0.31642287969589233,"customer":0.014390327967703342}},"sort":[9.424737,1775343812754]}]},"aggregations":{"places":{"doc_count":1927,"only_spatial":{"doc_count":0,"place_names":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[]}}},"languag
es":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[{"key":"en","doc_count":1925},{"key":"english","doc_count":188},{"key":"en_us","doc_count":59},{"key":"eng","doc_count":5},{"key":"hungarian","doc_count":1},{"key":"multiple languages","doc_count":1},{"key":"swedish","doc_count":1}]},"content_type":{"doc_count_error_upper_bound":0,"sum_other_doc_count":40,"buckets":[{"key":"article","doc_count":1515},{"key":"libguide","doc_count":629},{"key":"archival materials","doc_count":192},{"key":"thesis","doc_count":174},{"key":"website","doc_count":63},{"key":"technical report","doc_count":32},{"key":"researchdatabases","doc_count":27},{"key":"learning object","doc_count":9},{"key":"not specified","doc_count":9},{"key":"speeches (compositions)","doc_count":5}]},"subjects":{"doc_count":1927,"subject_names":{"doc_count_error_upper_bound":9,"sum_other_doc_count":1806,"buckets":[{"key":"massachusetts institute of technology -- history","doc_count":78},{"key":"interdisciplinary","doc_count":45},{"key":"massachusetts institute of technology -- faculty","doc_count":40},{"key":"business & management","doc_count":34},{"key":"social sciences","doc_count":31},{"key":"humanities","doc_count":29},{"key":"business & management, social sciences","doc_count":27},{"key":"engineering, science","doc_count":23},{"key":"academic departments","doc_count":21},{"key":"academic affairs","doc_count":16}]}},"content_format":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[{"key":"electronic resource","doc_count":2470}]},"literary_form":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[]},"source":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[{"key":"dspace@mit","doc_count":1751},{"key":"libguides","doc_count":629},{"key":"mit archivesspace","doc_count":192},{"key":"mit libraries website","doc_count":63},{"key":"research 
databases","doc_count":27}]},"contributors":{"doc_count":13460,"contributor_names":{"doc_count_error_upper_bound":55,"sum_other_doc_count":12244,"buckets":[{"key":"massachusetts institute of technology. department of electrical engineering and computer science","doc_count":207},{"key":"massachusetts institute of technology. department of mechanical engineering","doc_count":194},{"key":"massachusetts institute of technology. department of chemical engineering","doc_count":160},{"key":"massachusetts institute of technology. computer science and artificial intelligence laboratory","doc_count":152},{"key":"massachusetts institute of technology. department of physics","doc_count":125},{"key":"sloan school of management","doc_count":81},{"key":"massachusetts institute of technology. department of urban studies and planning","doc_count":80},{"key":"massachusetts institute of technology. department of earth, atmospheric, and planetary sciences","doc_count":76},{"key":"massachusetts institute of technology. laboratory for nuclear science","doc_count":75},{"key":"adam, w.","doc_count":66}]}},"access_to_files":{"doc_count":2732,"only_file_access":{"doc_count":0,"access_types":{"doc_count_error_upper_bound":0,"sum_other_doc_count":0,"buckets":[]}}}}} + recorded_at: Thu, 30 Apr 2026 22:47:38 GMT +recorded_with: VCR 6.4.0