# Sample Elasticsearch Queries

*Query date: Wed, April 6, 2016*

### Query 1 : Count Documents by Index Type (Article, Blog, Interactive, Slideshow, or Video)

In [2]:
%%bash
# Count the documents of each type in the nytimes index using a terms
# aggregation on the _type field.
#
# Abort with a clear message when the host variable is missing; otherwise
# curl is handed the malformed URL ":9200/...".
: "${ELASTICSEARCH_HOST:?ELASTICSEARCH_HOST must be set}"
# size=0 returns the aggregation without any hits. It replaces
# search_type=count, which is deprecated as of Elasticsearch 2.0.
# The Content-Type header labels the body as JSON rather than curl's default
# form encoding.
curl -XPOST "${ELASTICSEARCH_HOST}:9200/nytimes/_search?size=0&pretty" \
  -H 'Content-Type: application/json' -d '
{ "aggs": {
    "count_by_type": {
        "terms": { "field": "_type" }
    }
}}'

{
  "took" : 3,
  "timed_out" : false,
  "_shards" : {
    "total" : 5,
    "successful" : 5,
    "failed" : 0
  },
  "hits" : {
    "total" : 32663,
    "max_score" : 0.0,
    "hits" : [ ]
  },
  "aggregations" : {
    "count_by_type" : {
      "doc_count_error_upper_bound" : 0,
      "sum_other_doc_count" : 0,
      "buckets" : [ {
        "key" : "Article",
        "doc_count" : 25519
      }, {
        "key" : "Blog",
        "doc_count" : 4194
      }, {
        "key" : "Slideshow",
        "doc_count" : 1232
      }, {
        "key" : "Interactive",
        "doc_count" : 1219
      }, {
        "key" : "Video",
        "doc_count" : 499
      } ]
    }
  }
}


  % Total    % Received % Xferd  Average Speed   Time    Time     Time  Current
                                 Dload  Upload   Total   Spent    Left  Speed
  0     0    0     0    0     0      0      0 --:--:-- --:--:-- --:--:--     0100   756  100   673  100    83  11207   1382 --:--:-- --:--:-- --:--:-- 11406


### Query 2 : Count Documents by Section Terms

In [3]:
%%bash
# Count documents per term of the "section" field using a terms aggregation.
#
# Abort with a clear message when the host variable is missing; otherwise
# curl is handed the malformed URL ":9200/...".
: "${ELASTICSEARCH_HOST:?ELASTICSEARCH_HOST must be set}"
# size=0 returns the aggregation without any hits. It replaces
# search_type=count, which is deprecated as of Elasticsearch 2.0.
# The Content-Type header labels the body as JSON rather than curl's default
# form encoding.
curl -XPOST "${ELASTICSEARCH_HOST}:9200/nytimes/_search?size=0&pretty" \
  -H 'Content-Type: application/json' -d '
{ "aggs": {
    "by_section": { "terms": { "field": "section" } }
  }
}'

{
  "took" : 7,
  "timed_out" : false,
  "_shards" : {
    "total" : 5,
    "successful" : 5,
    "failed" : 0
  },
  "hits" : {
    "total" : 32673,
    "max_score" : 0.0,
    "hits" : [ ]
  },
  "aggregations" : {
    "by_section" : {
      "doc_count_error_upper_bound" : 3,
      "sum_other_doc_count" : 12955,
      "buckets" : [ {
        "key" : "u.s",
        "doc_count" : 4581
      }, {
        "key" : "sports",
        "doc_count" : 3650
      }, {
        "key" : "world",
        "doc_count" : 3523
      }, {
        "key" : "opinion",
        "doc_count" : 2958
      }, {
        "key" : "arts",
        "doc_count" : 2869
      }, {
        "key" : "business",
        "doc_count" : 2691
      }, {
        "key" : "day",
        "doc_count" : 2691
      }, {
        "key" : "n.y",
        "doc_count" : 2187
      }, {
        "key" : "region",
        "doc_count" : 2187
      }, {
        "key" : "style",
        "doc_count" : 1551
      } ]
    }
  }
}


  % Total    % Received % Xferd  Average Speed   Time    Time     Time  Current
                                 Dload  Upload   Total   Spent    Left  Speed
  0     0    0     0    0     0      0      0 --:--:-- --:--:-- --:--:--     0100  1050  100   978  100    72  15107   1112 --:--:-- --:--:-- --:--:-- 15281


### Query 3 : Weekly Count of Documents by Published Date

In [4]:
%%bash
# Bucket documents into one-week intervals of "published_date" using a
# date_histogram aggregation.
#
# Abort with a clear message when the host variable is missing; otherwise
# curl is handed the malformed URL ":9200/...".
: "${ELASTICSEARCH_HOST:?ELASTICSEARCH_HOST must be set}"
# size=0 returns the aggregation without any hits. It replaces
# search_type=count, which is deprecated as of Elasticsearch 2.0.
# The Content-Type header labels the body as JSON rather than curl's default
# form encoding.
curl -XPOST "${ELASTICSEARCH_HOST}:9200/nytimes/_search?size=0&pretty" \
  -H 'Content-Type: application/json' -d '
{ "aggs": {
    "weekly_count": {
      "date_histogram": {
        "field": "published_date",
        "interval": "week"
      }
    }
  }
}'

{
  "took" : 6,
  "timed_out" : false,
  "_shards" : {
    "total" : 5,
    "successful" : 5,
    "failed" : 0
  },
  "hits" : {
    "total" : 32677,
    "max_score" : 0.0,
    "hits" : [ ]
  },
  "aggregations" : {
    "weekly_count" : {
      "buckets" : [ {
        "key_as_string" : "2015-11-09T00:00:00.000Z",
        "key" : 1447027200000,
        "doc_count" : 1167
      }, {
        "key_as_string" : "2015-11-16T00:00:00.000Z",
        "key" : 1447632000000,
        "doc_count" : 1512
      }, {
        "key_as_string" : "2015-11-23T00:00:00.000Z",
        "key" : 1448236800000,
        "doc_count" : 1326
      }, {
        "key_as_string" : "2015-11-30T00:00:00.000Z",
        "key" : 1448841600000,
        "doc_count" : 1573
      }, {
        "key_as_string" : "2015-12-07T00:00:00.000Z",
        "key" : 1449446400000,
        "doc_count" : 1597
      }, {
        "key_as_string" : "2015-12-14T00:00:00.000Z",
        "key" : 1450051200000,
        "doc_count" : 1722
      }, {
 

  % Total    % Received % Xferd  Average Speed   Time    Time     Time  Current
                                 Dload  Upload   Total   Spent    Left  Speed
  0     0    0     0    0     0      0      0 --:--:-- --:--:-- --:--:--     0 44  3359   42  1360  100   142  21430   2237 --:--:-- --:--:-- --:--:-- 21250100  3359  100  3217  100   142  49057   2165 --:--:-- --:--:-- --:--:-- 48742


### Query 4 : Common Terms In NYT Blog Names

In [5]:
%%bash
# Count documents per term of the "blog_name" field using a terms aggregation.
#
# Abort with a clear message when the host variable is missing; otherwise
# curl is handed the malformed URL ":9200/...".
: "${ELASTICSEARCH_HOST:?ELASTICSEARCH_HOST must be set}"
# size=0 returns the aggregation without any hits. It replaces
# search_type=count, which is deprecated as of Elasticsearch 2.0.
# The Content-Type header labels the body as JSON rather than curl's default
# form encoding.
curl -XPOST "${ELASTICSEARCH_HOST}:9200/nytimes/_search?size=0&pretty" \
  -H 'Content-Type: application/json' -d '
{ "aggs": {
    "blog_terms": {
      "terms": { "field": "blog_name"  }
    }
  }
}'

{
  "took" : 3,
  "timed_out" : false,
  "_shards" : {
    "total" : 5,
    "successful" : 5,
    "failed" : 0
  },
  "hits" : {
    "total" : 32687,
    "max_score" : 0.0,
    "hits" : [ ]
  },
  "aggregations" : {
    "blog_terms" : {
      "doc_count_error_upper_bound" : 0,
      "sum_other_doc_count" : 1861,
      "buckets" : [ {
        "key" : "draft",
        "doc_count" : 1291
      }, {
        "key" : "first",
        "doc_count" : 1291
      }, {
        "key" : "artsbeat",
        "doc_count" : 487
      }, {
        "key" : "the",
        "doc_count" : 414
      }, {
        "key" : "learning",
        "doc_count" : 381
      }, {
        "key" : "network",
        "doc_count" : 381
      }, {
        "key" : "well",
        "doc_count" : 317
      }, {
        "key" : "iht",
        "doc_count" : 266
      }, {
        "key" : "retrospective",
        "doc_count" : 266
      }, {
        "key" : "note",
        "doc_count" : 238
      } ]
    }
  }
}


  % Total    % Received % Xferd  Average Speed   Time    Time     Time  Current
                                 Dload  Upload   Total   Spent    Left  Speed
  0     0    0     0    0     0      0      0 --:--:-- --:--:-- --:--:--     0100  1064  100   979  100    85  16303   1415 --:--:-- --:--:-- --:--:-- 16593


### Query 5 : Query Articles Related to the Batman vs Superman Movie

In [8]:
%%bash
# Search document titles for "batman superman" with a query_string query and
# return only the url and title of each hit.
#
# Abort with a clear message when the host variable is missing; otherwise
# curl is handed the malformed URL ":9200/...".
: "${ELASTICSEARCH_HOST:?ELASTICSEARCH_HOST must be set}"
# "_id" is omitted from the _source filter: the id is reported as hit
# metadata next to _index and _type, not as part of the stored source, so
# listing it there had no effect on the response.
# The Content-Type header labels the body as JSON rather than curl's default
# form encoding.
curl -XPOST "${ELASTICSEARCH_HOST}:9200/nytimes/_search?pretty" \
  -H 'Content-Type: application/json' -d '
{ "query": {
    "query_string": {
        "fields": ["title"],
        "query": "batman superman"
     }
  },
  "_source": ["url", "title"]
}'

{
  "took" : 2,
  "timed_out" : false,
  "_shards" : {
    "total" : 5,
    "successful" : 5,
    "failed" : 0
  },
  "hits" : {
    "total" : 14,
    "max_score" : 4.3961687,
    "hits" : [ {
      "_index" : "nytimes",
      "_type" : "Article",
      "_id" : "2244",
      "_score" : 4.3961687,
      "_source":{"title":"Review: ‘Batman v Superman’ ... v Fun?","url":"http://www.nytimes.com/2016/03/25/movies/review-batman-v-superman-dawn-of-justice-when-super-friends-fight.html"}
    }, {
      "_index" : "nytimes",
      "_type" : "Article",
      "_id" : "1593",
      "_score" : 4.2483974,
      "_source":{"title":"Batman vs. Superman, by the Numbers","url":"http://www.nytimes.com/2016/03/28/movies/batman-vs-superman-by-the-numbers.html"}
    }, {
      "_index" : "nytimes",
      "_type" : "Article",
      "_id" : "1877",
      "_score" : 4.2483974,
      "_source":{"title":"‘Batman v Superman’ Battles the Critics","url":"http://www.nytimes.com/2016/03/26/movies/batman-v-superman-da

  % Total    % Received % Xferd  Average Speed   Time    Time     Time  Current
                                 Dload  Upload   Total   Spent    Left  Speed
  0     0    0     0    0     0      0      0 --:--:-- --:--:-- --:--:--     0100  3325  100  3173  100   152  53573   2566 --:--:-- --:--:-- --:--:-- 53779
