# Advanced Querying Mongo

Importing libraries and setting up connection

In [110]:
from pymongo import MongoClient


In [111]:
client = MongoClient()

In [112]:
db = client.ironhack

In [113]:
db

Database(MongoClient(host=['localhost:27017'], document_class=dict, tz_aware=False, connect=True), 'ironhack')

### 1. All the companies whose name match 'Babelgum'. Retrieve only their `name` field.

In [114]:
# Your Code
query = {"name":{"$eq":"Babelgum"}}
list(db["companies"].find(query,{"_id":0, "name":1}))

[{'name': 'Babelgum'}]

### 2. All the companies that have more than 5000 employees. Limit the search to 20 companies and sort them by **number of employees**.

In [116]:
# Your Code
query2 ={"number_of_employees":{"$gt":5000}}
res=list(db["companies"].find(query2).limit(20).sort("number_of_employees",-1))

### 3. All the companies founded between 2000 and 2005, both years included. Retrieve only the `name` and `founded_year` fields.

In [117]:
# Your Code
query={"founded_year":{"$gte":2000, "$lte": 2005}}
res=list(db["companies"].find(query,{"_id":0, "name":1, "founded_year":1}))

### 4. All the companies that had a Valuation Amount of more than 100.000.000 and have been founded before 2010. Retrieve only the `name` and `ipo` fields.

In [118]:
# Your Code
query = {"ipo.valuation_amount":{"$gt":100_000_000}, "founded_year":{"$lt": 2010}}
res=list(db["companies"].find(query,{"name":1, "ipo":1, "_id":0}))

### 5. All the companies that have less than 1000 employees and have been founded before 2005. Order them by the number of employees and limit the search to 10 companies.

In [121]:
# Your Code
query = {"number_of_employees":{"$lt":1000}, "founded_year":{"$lt":2005}}
res = list(db["companies"].find(query).limit(10).sort("number_of_employees",1))

### 6. All the companies that don't include the `partners` field.

In [120]:
# Your Code
query3= {"partners":{"$size":0}}
res = list(db["companies"].find(query3, {"name":1, "_id":0}))

### 7. All the companies that have a null type of value on the `category_code` field.

In [119]:
# Your Code
query = {"category_code":{"$type":"null"}}
res = list(db["companies"].find(query, {"name":1, "category_code":1, "_id":0}))

### 8. All the companies that have at least 100 employees but less than 1000. Retrieve only the `name` and `number of employees` fields.

In [122]:
# Your Code
query = {"number_of_employees":{"$gte": 100, "$lt": 1000}}
res = list(db["companies"].find(query, {"name":1, "number_of_employees":1, "_id":0}))

### 9. Order all the companies by their IPO price in a descending order.

In [97]:
# Your Code

res=list(db["companies"].find({},{"_id": 0, "name": 1, "ipo.valuation_amount": 1}).sort("ipo.valuation_amount", -1))
res[:5]

OperationFailure: Executor error during find command :: caused by :: errmsg: "Sort operation used more than the maximum 33554432 bytes of RAM. Add an index, or specify a smaller limit.", full error: {'ok': 0.0, 'errmsg': 'Executor error during find command :: caused by :: errmsg: "Sort operation used more than the maximum 33554432 bytes of RAM. Add an index, or specify a smaller limit."', 'code': 96, 'codeName': 'OperationFailed'}

### 10. Retrieve the 10 companies with more employees, order by the `number of employees`

In [123]:
# Your Code
res = list(db["companies"].find().sort([('number_of_employees',-1)]).limit(10))

### 11. All the companies founded on the second semester of the year. Limit your search to 1000 companies.

In [126]:
# Your Code
query = {"founded_month":{"$gt":6}}
res = list(db["companies"].find(query, {"name":1, "founded_month":1, "_id":0}))

### 12. All the companies founded before 2000 that have an acquisition amount of more than 10.000.00

In [127]:
# Your Code
query = {"founded_year":{"$lt":2000}, "acquisition.price_amount":{"$gt":10_000}}
res = list(db["companies"].find(query, {"name":1, "founded_year":1, "acquisition.price_amount":1, "_id":0}))

### 13. All the companies that have been acquired after 2010, order by the acquisition amount, and retrieve only their `name` and `acquisition` field.

In [128]:
# Your Code
query = {"acquisition.acquired_year":{"$gt":2010}}
res = list(db["companies"].find(query, {"name":1, "acquisition":1}).sort("acquisition.price_amount",1))

### 14. Order the companies by their `founded year`, retrieving only their `name` and `founded year`.

In [102]:
# Your Code
query = {}

### 15. All the companies that have been founded on the first seven days of the month, including the seventh. Sort them by their `acquisition price` in a descending order. Limit the search to 10 documents.

In [129]:
# Your Code
query = {"founded_day":{"$lte":7}}
res = list(db["companies"].find(query, {"name":1, "founded_day":1, "acquisition.price_amount":1, "_id":0}).sort("acquisition.price_amount", -1))

### 16. All the companies on the 'web' `category` that have more than 4000 employees. Sort them by the amount of employees in ascending order.

In [130]:
# Your Code
query = {"category_code":"web", "number_of_employees":{"$gt":4000}}
res = list(db["companies"].find(query, {"name":1, "category_code":1, "number_of_employees":1, "_id":0}).sort("number_of_employees",1))

### 17. All the companies whose acquisition amount is more than 10.000.000, and currency is 'EUR'.

In [131]:
# Your Code
query = {"acquisition.price_currency_code":"EUR", "acquisition.price_amount":{"$gt":10_000_000}}
res = list(db["companies"].find(query, {"name":1, "acquisition.price_amount":1, "_id":0}))

### 18. All the companies that have been acquired on the first trimester of the year. Limit the search to 10 companies, and retrieve only their `name` and `acquisition` fields.

In [132]:
# Your Code
query = {"acquisition.acquired_month":{"$lte":3}}
res = list(db["companies"].find(query, {"name":1, "acquisition":1, "_id":0}))

# Bonus
### 19. All the companies that have been founded between 2000 and 2010, but have not been acquired before 2011.

In [133]:
# Your Code
query = {'$and':[{"acquisition.acquired_year": {'$lt': 2011}}, {'founded_year': { '$gt' : 1999 , '$lt' : 2010 }}]}
res = list(db.companies.find (query, {"_id":0, "acquisition.acquired_year":1,'founded_year':1}))

### 20. All the companies that have been 'deadpooled' after the third year.

In [108]:
# Your Code
res = db["companies"].agregate(
    [
        {"$project":{"deadpool":{"$subtract":["$deadpool_year"]}}}
    ]
)

TypeError: 'Collection' object is not callable. If you meant to call the 'agregate' method on a 'Collection' object it is failing because no such method exists.

In [109]:
list(db["companies"].find({"$where":{"this.deadpooled_year - this.founded_year > 3"} {"name":1, "founded_year":1, "deadpooled_year":1}}))

SyntaxError: invalid syntax (<ipython-input-109-0d4875d761f1>, line 1)