# Test Deep Search Plugin

Just press `►►` and check for errors.

### Prep

In [None]:
# Import the patents test file into your workspace and load it as a dataframe
import os
import pandas as pd

# Patents csv file: files/my_patents.csv, resolved against the current working
# directory, so the notebook must be run from the folder that contains `files/`
patents_path = os.path.join(os.getcwd(), 'files', 'my_patents.csv')
# Make the csv available in the workspace as 'my_patents.csv' (used by the "From file" cell)
%openad import from '{patents_path}' to 'my_patents.csv'

# Patents dataframe, read from the same csv (used by the "From dataframe" cell)
my_patents_df = pd.read_csv(patents_path)

<br>
<h2><u><b>Plugin Help</b></u></h2>

In [None]:
# Full name
%openad deep search

In [None]:
# Full name, trailing ?
%openad deep search ?

In [None]:
# Full name, leading ?
%openad ? deep search

In [None]:
# Abbreviated form (ds)
%openad ds

In [None]:
# Abbreviated form, trailing ?
%openad ds ?

In [None]:
# Abbreviated form, leading ?
%openad ? ds

<br>
<h2><u><b>Molecules</b></u></h2>

### Search for molecules similar to

In [None]:
# Command help
%openad ds search for molecules similar ?

In [None]:
# Without quotes
%openad ds search for molecules similar to CC(=CCC/C(=C/CO)/C)C

In [None]:
# With quotes
%openad ds search for molecules similar to 'C1(C(=C)C([O-])C1C)=O'

In [None]:
# Save as
%openad ds search for molecules similar to CC1=CCC2CC1C2(C)C save as 'similar_mols.csv'

In [None]:
# Save as, no extension
%openad ds search for molecules similar to CC1CCC2C1C(=O)OC=C2C save as 'similar_mols'

In [None]:
# Data API
df = %openadd ds search for molecules similar to CC(=CCC/C(=C/CO)/C)C
df

<br>

### Search for molecules with substructure

In [None]:
# Command help
%openad ds search for molecules with substructure ?

In [None]:
# Without quotes
%openad ds search for molecules with substructure C1(C(=C)C([O-])C1C)=O

In [None]:
# With quotes, save as
%openad ds search for molecules with substructure 'C1=CCCCC1' save as 'my_mol'

In [None]:
# Data API
df = %openadd ds search for molecules with substructure C1(C(=C)C([O-])C1C)=O
df

<br>

### Search for molecules in patents

In [None]:
# Command help
%openad ds search for molecules in patents ?

In [None]:
# From list
%openad ds search for molecules in patents from list ['CN108473493B','US20190023713A1']

In [None]:
# From file
%openad ds search for molecules in patents from file 'my_patents.csv'

In [None]:
# From dataframe
%openad ds search for molecules in patents from dataframe my_patents_df

In [None]:
# Data API
data = %openadd ds search for molecules in patents from list ['CN108473493B','US20190023713A1']
data

<br>
<h2><u><b>Collections</b></u></h2>

### List all collections

In [None]:
# Command help
%openad ds list all collections ?

In [None]:
# Basic
%openad ds list all collections

In [None]:
# With details
%openad ds list all collections details

In [None]:
# Save as
%openad ds list all collections save as 'all_collections.csv'

In [None]:
# Data API
data = %openadd ds list all collections
data

<br>

### List all domains

In [None]:
# Command help
%openad ds list all domains ?

In [None]:
# Basic
%openad ds list all domains

In [None]:
# Save as
%openad ds list all domains save as 'all_domains'

In [None]:
# Data API
data = %openadd ds list all domains
data

<br>

### List collections containing

In [None]:
# Command help
%openad ds list collections containing ?

In [None]:
# Simple search
%openad ds list collections containing 'Ibuprofen'

In [None]:
# Quoted search
%openad ds list collections containing '"blood-brain barrier"'

In [None]:
# Complex search
%openad ds list collections containing 'main-text.text:("power conversion efficiency" OR PCE) AND organ*'

In [None]:
# Data API
data = %openadd ds list collections containing 'Ibuprofen'
data

<br>

### List collections for domain(s)

In [None]:
# Command help
%openad ds list collections for domain ?

In [None]:
# Single domain
%openad ds list collections for domain 'Business Insights'

In [None]:
# Multiple domains
%openad ds list collections for domains ['Materials Science','Scientific Literature']

In [None]:
# Data API
data = %openadd ds list collections for domain 'Business Insights'
data

<br>

### List collection details

In [None]:
# Command help
%openad ds list collection details ?

In [None]:
# By name
%openad ds list collection details 'Patents from USPTO'

In [None]:
# By key
%openad ds list collection details 'patent-uspto'

In [None]:
# Data API
data = %openadd ds list collection details 'Patents from USPTO'
data

<br>

### Search collection

In [None]:
# Command help
%openad ds search collection ?

In [None]:
# Regular search with USING options (limit_results=10, slop=0), show docs
%openad ds search collection 'arxiv-abstract' for 'ide("power conversion efficiency" OR PCE) AND organ*' USING (limit_results=10 slop=0) show (docs)

In [None]:
# Slop: same quoted phrase with slop=0, slop=1 and slop=5, estimate only
%openad ds search collection 'arxiv-abstract' for '"power efficiency"' USING (slop=0) estimate only
%openad ds search collection 'arxiv-abstract' for '"power efficiency"' USING (slop=1) estimate only
%openad ds search collection 'arxiv-abstract' for '"power efficiency"' USING (slop=5) estimate only

In [None]:
# Show data with molecules, then open the result
%openad ds search collection 'pubchem' for 'Ibuprofen' show (data)
%openad result open

In [None]:
# Show data
%openad ds search collection 'patent-uspto' for '"CC(CCO)CCCC(C)C"' show (data)

In [None]:
# Show docs
%openad ds search collection 'patent-uspto' for '"CC(CCO)CCCC(C)C"' show (docs)

In [None]:
# Data API
data = %openadd ds search collection 'arxiv-abstract' for '"power conversion efficiency"' USING (slop=0)
data

<br>
<h2><u><b>Patents</b></u></h2>

### Search for patents

In [None]:
# Command help
%openad ds search for patents ?

In [None]:
# SMILES unquoted
%openad ds search for patents containing molecule CC(C)(c1ccccn1)C(CC(=O)O)Nc1nc(-c2c[nH]c3ncc(Cl)cc23)c(C#N)cc1F

In [None]:
# SMILES quoted, save as
%openad ds search for patents containing molecule 'CC(C)(c1ccccn1)C(CC(=O)O)Nc1nc(-c2c[nH]c3ncc(Cl)cc23)c(C#N)cc1F' save as 'patents'

In [None]:
# InChI
%openad ds search for patents containing molecule InChI=1S/C24H20ClFN6O2/c1-24(2,18-5-3-4-6-28-18)19(9-20(33)34)31-23-17(26)7-13(10-27)21(32-23)16-12-30-22-15(16)8-14(25)11-29-22/h3-8,11-12,19H,9H2,1-2H3,(H,29,30)(H,31,32)(H,33,34)

In [None]:
# InChIKey unquoted
# Note: No molecule preview for InChIKey identifier
%openad ds search for patents containing molecule JUPUMSRQQQUOLP-UHFFFAOYSA-N save as 'patents'

In [None]:
# InChIKey quoted
%openad ds search for patents containing molecule 'JUPUMSRQQQUOLP-UHFFFAOYSA-N'

In [None]:
# Data API
data = %openadd ds search for patents containing molecule JUPUMSRQQQUOLP-UHFFFAOYSA-N
data

<br>

### Enrich molecule working set with Deep Search analysis

In [None]:
# Start clean: clear the analysis cache and the molecules (`clear mols`)
%openad clear analysis cache
%openad clear mols

# Two test molecules as SMILES strings
sm1 = 'CC(=O)N1CCC2(CC1)C3=C(C=CC(=C3)C#CC4C(C(C(C(O4)CO)O)O)O)C5=C2C=C(C=C5)C#CC6C(C(C(C(O6)CO)O)O)O'
sm2 = 'C1(C(=C)C([O-])C1C)=O'
# Run one patent search and one similarity search through the data API.
# `x` is overwritten and never read in this cell; presumably the assignment
# only keeps the returned data from being displayed, and these searches are
# what produce the analysis used by the enrich step — TODO confirm.
x = %openadd ds search for patents containing molecule '{sm1}'
x = %openadd ds search for molecules similar to '{sm2}'
# Add both molecules, then enrich them with the analysis
%openad add molecule '{sm1}' force
%openad add molecule '{sm2}' force
%openad enrich molecules with analysis
# Show each molecule to inspect the result
%openad show mol '{sm1}'
%openad show mol '{sm2}'