In [38]:
!pip install langchain --quiet
!pip install openai --quiet
!pip install pdf2image --quiet
!pip install tabulate --quiet
!pip install tiktoken --quiet
!pip install unstructured --quiet

In [42]:
from langchain.document_loaders import OnlinePDFLoader

# Point the loader at the source PDF. Note the URL is plain http, not https.
loader = OnlinePDFLoader("http://leavcom.com/pdf/DBpdf.pdf")

# `data` is consumed by the following cells as a sequence whose items expose
# `.page_content`. The nltk download messages below are emitted during this call.
data = loader.load()

[nltk_data] Downloading package punkt to /home/jovyan/nltk_data...
[nltk_data]   Unzipping tokenizers/punkt.zip.
[nltk_data] Downloading package averaged_perceptron_tagger to
[nltk_data]     /home/jovyan/nltk_data...
[nltk_data]   Unzipping taggers/averaged_perceptron_tagger.zip.


In [43]:
from langchain.text_splitter import RecursiveCharacterTextSplitter

# Sanity-check what the loader returned before splitting it: how many documents
# came back, and how long the first one is.
document_count = len(data)
print(f"You have {document_count} document(s) in your data")

first_document_chars = len(data[0].page_content)
print(f"There are {first_document_chars} characters in your document")

You have 1 document(s) in your data
There are 13040 characters in your document


In [44]:
# Break the loaded document into chunks (chunk_size 2000, no overlap between
# neighbouring chunks). Each chunk is embedded and stored separately later on.
text_splitter = RecursiveCharacterTextSplitter(
    chunk_size=2000,
    chunk_overlap=0,
)
texts = text_splitter.split_documents(data)

# The message says "pages", but the number reported is the count of chunks.
chunk_count = len(texts)
print(f"You have {chunk_count} pages")

You have 8 pages


In [45]:
%%sql

-- Start from a clean slate by dropping any existing pdf_db before creating it again.
DROP DATABASE IF EXISTS pdf_db;
CREATE DATABASE IF NOT EXISTS pdf_db;



In [46]:
%%sql

USE pdf_db;
-- Recreate the table on every run so the insert cell always starts from an empty table.
DROP TABLE IF EXISTS pdf_docs1;
CREATE TABLE IF NOT EXISTS pdf_docs1 (
    -- Set by the insert cell to the 1-based position of the chunk.
    id INT PRIMARY KEY,
    -- Text of the chunk.
    content TEXT CHARACTER SET utf8mb4 COLLATE utf8mb4_general_ci,
    -- Embedding of the chunk as packed by JSON_ARRAY_PACK_F32 in the insert cell.
    vector BLOB
);



In [47]:
# Import only the name this notebook uses; a wildcard import hides where names
# come from and can silently shadow other globals.
from sqlalchemy import create_engine

# NOTE(review): `connection_url` is not defined in any visible cell. It is
# presumably injected by the hosting notebook environment; confirm, or define
# it explicitly before this cell so the notebook survives Restart & Run All.
db_connection = create_engine(connection_url)

In [48]:
import getpass
import os

# Ask for the key interactively instead of hard-coding it in the notebook, then
# publish it through the process environment.
api_key_prompt = "OpenAI API Key:"
os.environ["OPENAI_API_KEY"] = getpass.getpass(prompt=api_key_prompt)

OpenAI API Key: ········


In [49]:
from langchain.embeddings import OpenAIEmbeddings

# Shared embedding client used by both the insert cell and the query cell.
# No key is passed here; presumably it is picked up from the OPENAI_API_KEY
# environment variable set in the previous cell (confirm).
embedder = OpenAIEmbeddings()

In [50]:
# Embed all chunks with a single embed_documents call instead of one call per
# chunk. Skip the call entirely when there is nothing to embed.
chunk_texts = [document.page_content for document in texts]
chunk_embeddings = embedder.embed_documents(chunk_texts) if chunk_texts else []

# The statement never changes, so it is built once outside the loop.
# str(embedding) renders the list of floats as a bracketed, comma-separated
# array, which JSON_ARRAY_PACK_F32 packs into the BLOB `vector` column.
stmt = """
    INSERT INTO pdf_docs1 (
        id,
        content,
        vector
    )
    VALUES (
        %s,
        %s,
        JSON_ARRAY_PACK_F32(%s)
    )
"""

# Row ids are the 1-based chunk positions, exactly as before.
# NOTE(review): `id` is the primary key, so re-running this cell without first
# re-running the CREATE TABLE cell will presumably fail on duplicate keys.
for chunk_id, (text_content, embedding) in enumerate(
    zip(chunk_texts, chunk_embeddings), start=1
):
    db_connection.execute(stmt, (chunk_id, text_content, str(embedding)))

In [51]:
%%sql

USE pdf_db;
-- Spot check that a stored vector unpacks back into a JSON array of floats.
-- There is no ORDER BY, so which row LIMIT 1 returns is not specified.
SELECT JSON_ARRAY_UNPACK_F32(vector)
FROM pdf_docs1
LIMIT 1;

JSON_ARRAY_UNPACK_F32(vector)
"[-0.00875275768,-0.01528366,0.0159704164,-0.0420670994,-0.019956287,0.00651743775,-0.0108938161,-0.0048106499,-0.0272816699,-0.0188520923,0.00709646614,0.024373062,0.0162397306,0.00352803431,-0.00311396155,0.035253413,0.0252618026,0.000304452871,0.022945689,-0.0115132425,-0.00130028941,0.00434271432,-0.0214509871,-0.0063390159,-0.00987714995,0.0128732855,0.0162801296,-0.0126241688,0.0222454686,-0.00861136708,-0.000350741495,-0.00791114569,-0.00505640032,0.0053021512,-0.0143006584,0.0181922689,-0.00714359619,-0.0165090468,0.00836224947,0.0234977864,0.0177478995,0.00196600403,-0.010799556,-0.0124827782,0.0215856452,0.0211008769,0.00380408275,-0.0221646745,-0.00709646614,-0.00695507554,-0.00795154367,0.056556277,-0.0345801227,-0.00291197491,-0.00138192566,-0.000453207671,-0.0138966851,0.0145430425,-0.00413399469,-0.0118566193,0.00525502069,0.0342030823,-0.0294092633,0.000438479474,-0.0488538519,0.00967516284,0.00655446853,-0.00396567257,0.00803233776,-0.00163440907,0.0184077211,0.0494463444,-0.00182461319,0.0276048481,-0.00701567158,-0.0369501002,0.00833531842,0.00251136813,-0.00702913711,-0.0088672163,0.0169938151,-0.0432790183,-0.0188251603,-0.000306556904,0.01698035,0.0208180957,-0.0309443623,0.00863156561,-0.00669585913,0.00861136708,0.00829492044,0.0206565075,0.00456489949,0.0105841029,0.00160158623,0.0279818904,0.012173065,0.0140986713,-0.0126712993,-0.00961456727,-0.0163609236,0.00146019552,-0.022959156,-0.00529878447,-0.0138966851,0.0212624669,0.026002422,-0.0168052949,0.0154183181,-0.0291938111,-0.0179229546,0.0376503207,0.0141794663,0.00852383953,0.00725805527,-0.00729845278,0.00971556082,-0.0252483375,7.67312758e-06,-0.0136206364,0.0124558462,0.0192022026,0.00785055012,-0.0365461297,0.000610588992,0.00261404458,-0.00652080402,0.0121394005,0.0315907225,-0.00298098708,0.00737251434,0.0297593735,-0.00373338745,0.0295169894,-0.00552433636,0.0218684264,-0.0215048511,0.0113045229,-0.0115940366,-0.0722843111,0.0239825547,0.00931158755,-0.00188184273,0.00972902589,
-0.00465242704,0.0180980098,0.0195792448,0.0211547408,0.00411379617,-0.0155529762,0.0179902818,0.00374685321,-0.0133580538,0.00943277963,0.0173977893,-0.00623128982,-0.0096347658,0.026015887,-0.0096347658,-0.0279549584,0.0110150082,0.0259350929,-0.00295742205,0.0253425986,0.0203602593,0.0153375231,0.01698035,0.0170207471,0.000592073542,-0.0116411671,0.00461876253,0.0391315594,-0.0269046277,0.0108130211,0.00538631203,-0.00235987804,0.00571622374,0.0164417177,-0.02597549,-0.0336375199,0.0195388477,0.00513719535,0.0104494458,0.0209392887,-0.00590474438,0.00553443562,0.00622455683,0.0105706379,-0.0101599311,0.0013592022,0.0179768167,0.0150278108,0.0102070617,-0.0019474884,-0.62825942,-0.00617069378,-0.0126039702,-0.0411244929,-0.00757450098,0.0137014315,0.0150951389,0.0158088263,0.000353055919,0.0249655563,-0.00727825426,-0.00125820888,0.00570612447,-0.0287090428,-0.0127722928,-0.0110419402,0.00633228291,-0.00408686465,-0.00679685269,0.00420468999,-0.00810640026,0.0106446994,0.00497897249,-0.0142737264,-0.0177882966,0.016791828,-0.00420468999,0.0157818943,0.0101599311,0.0177075006,0.00405656639,0.00316445832,0.0164955817,0.00143578881,0.0404242724,0.00320653897,-0.0116277011,0.0164147858,0.0374348685,0.0403704084,-0.00545027433,-0.0192022026,0.00657803332,0.00108399533,-0.0166302398,0.00583741581,0.0253695305,-0.0191348735,-0.0021730403,-0.0135735059,-0.0015073258,-0.000240700814,-0.0182192009,-0.0209123567,0.024319198,-0.000477193564,0.0179094877,-0.0336913839,0.019929355,0.00273523666,0.012987745,0.0196061768,-0.026069751,-0.012199997,-0.0326949172,0.0189867504,-0.019929355,0.0124423811,0.0235112514,-0.0218818933,-0.0215048511,0.031994693,0.000409864675,-0.0232688673,0.000643411826,0.00216294103,0.0242114719,0.00922405999,-0.0272278078,0.0241037458,0.018394256,-0.0246827751,-0.0135196429,0.00493520871,0.0277125761,0.00592157664,-0.00978962239,-0.0158222914,-0.00851710606,-0.0169938151,0.0120720714,0.0141390692,-0.00715032918,-0.0043864781,0.0162801296,0.0355496593,-0.
0254637897,-0.00449420419,0.000994784525,-0.0110890698,-0.00454806723,-0.00668239314,0.00457836548,0.0248308983,-0.0185827762,0.0338799022,0.00603266945,0.028897563,0.0281165484,-0.00960783474,0.00497223949,-0.0021545249,0.00766202854,0.019808162,-0.00725805527,-0.00911633298,0.0253156666,0.00359199685,-0.0194849838,-0.0254368577,0.00607306696,-0.00403973414,0.0192022026,-0.0430097021,-0.0155395102,-0.00471975608,0.0112775909,0.011466112,0.00569939148,-0.00213264301,0.00270998827,-0.0154587151,0.0131560666,-0.0246693101,-0.0032048556,0.00082982867,0.00935871713,-0.010732227,-0.0142198633,-0.0232957993,-0.000155382484,-0.0226090457,0.00710319914,-0.0141660003,-0.00882008579,-0.0233631283,-0.0317792408,0.0267834365,-0.0267026424,-0.00366942515,-0.01372163,-0.0125097102,-0.0226763748,0.0189328864,0.00312742754,0.00154856476,-0.0147584947,-0.0251136795,-0.0370847583,-0.004598564,-0.0094933752,0.00440667663,-0.0145969056,0.0040498334,-0.00177916617,-0.055155836,-0.0186097082,0.0200640131,-0.0182192009,-0.0270258207,-0.00602930319,-0.0195657797,0.0240633488,-0.00820739288,-0.0148123577,-0.00335971219,-0.0290052909,0.000344429398,0.0499311127,-0.0197004359,0.00798520818,-0.00798520818,0.00381754851,-0.0159300193,0.0141660003,-0.0181653388,0.0065645678,0.0100656711,-0.00219997182,0.00584751507,0.021424057,0.044329349,-0.00806600228,0.000767128658,-0.00745330937,-0.0108870836,-0.0192022026,0.00111513492,-0.00173876889,0.030513458,0.0286282487,0.000732622575,-0.00477361912,0.00836898293,0.0103349863,0.00518769166,-0.0122807911,-0.00457499875,0.0112035293,0.00906246994,0.0157818943,0.000567245996,0.0134927118,-0.0161050744,0.00353813358,0.0410436988,-0.00313920993,0.0208854247,-0.0263121333,-0.0045413347,-0.00603603572,0.0143410554,0.0361690857,0.00428548455,0.0178960226,-0.00585088134,0.00410369644,0.0179229546,0.0142063983,-0.0233631283,-0.00542334281,0.00463559479,0.00656793406,0.00655446853,0.0129271485,0.0267161075,0.0446525253,-0.0434675403,0.0220973454,0.000345060631,-0
.0195792448,0.038377475,0.0164417177,-0.000757870963,0.000956912001,-0.00674635591,0.0237536356,0.0128665529,-0.026069751,0.00120939536,-0.0146238366,0.00346070551,-0.0136610335,0.009210594,-0.00203333283,-0.0213567279,0.0166167729,0.0112439264,0.0408282466,0.000655194395,0.00144757133,0.00263087684,0.0122201955,-0.00533244899,0.012159599,0.0129406145,0.00682715047,0.0123885181,-0.00257028081,0.000924930733,-0.0131829986,-0.0277664382,-0.00236492767,0.00904900488,-0.00607306696,0.0288437009,-0.0215452481,0.00129523978,0.0097761564,0.0293015372,-0.00629861886,-0.0253022015,-0.00500590401,0.00952703971,0.00239859219,-0.0190136824,-0.0284666587,0.0173977893,-0.00741964485,-0.00162262644,0.00190709112,0.0255580507,0.000535685569,0.00493857497,0.015310592,0.0122201955,0.0418785773,-0.0163878556,-0.0243057329,-0.00169752992,0.0128665529,-0.000221343755,0.00280929846,-0.024467323,0.0617271364,-0.0294900574,0.00976942386,-0.018488517,-0.0170476791,-0.00870562717,-0.0203063972,-0.0210739467,-0.0250059534,0.0189598184,0.0103888493,-0.0175593775,0.0027857332,0.00479045138,0.0324525312,0.0217876323,0.0127251623,-0.032290943,-0.00989061594,0.0098367529,0.0537015311,-0.0196196418,-0.0211547408,0.0328834355,-0.0112439264,-0.0180037487,-0.021531783,-0.0247097071,0.00573978899,0.0203063972,-0.0154721811,0.00255176541,0.0439253747,-0.000243225644,-0.00108399533,0.00278236694,0.0087258257,-0.0406935886,0.00341357524,-0.0104898429,-0.0421748236,-0.0204814523,0.00980308838,0.0281973425,0.041151423,-0.00405320013,0.0437099226,0.0394008718,0.0189328864,-0.0257331058,-0.0188924894,0.0160916075,-0.00857770257,0.0130079435,-0.00232453039,0.0180710778,0.00324525288,-0.0112304604,-0.00711666467,0.00987041742,0.0147584947,0.0119845439,0.0153509891,-0.0156068392,-0.0187982302,-0.00809293427,-0.00204679859,0.0115873041,-0.018394256,-0.0199697521,-0.0292207431,-0.000961961632,-0.0138966851,0.0156203043,-0.0107254935,-0.00578691904,-0.0219896194,-0.00770915905,-0.0155933732,-0.0288706329,-0.0123413
876,-0.0025770138,0.0590878427,-0.00767549453,0.00490827672,-0.00268642325,-0.0147854267,-0.00246592099,-0.0295439214,-0.0140852062,0.0145430425,-0.0331258215,-0.0266487785,-0.000753662898,0.0346070565,0.00248611975,0.00989061594,0.00527858594,0.00123464374,-0.00925772451,-0.0120855374,-0.0193907246,-0.0177478995,-0.0360074975,-0.0292746052,0.0141929323,-0.0109072821,0.00435281359,-0.012920416,0.000956070377,-0.00209224573,-0.0406397246,0.0278472323,0.000725468912,0.0258138999,0.0103821168,0.0330719575,0.0124356477,-0.00309039652,-0.035064891,-0.0313214064,0.0205353145,-0.0221781395,-0.0421478935,0.02597549,0.0103147877,-0.0191752706,0.00415755995,0.00934525207,-0.00131964649,0.00582731655,-0.0281434804,0.018461585,-0.00904900488,0.0162262656,-0.00256859767,0.00329406653,0.0350110307,0.0096953623,-0.00768896053,-0.0131695326,-0.00358863035,0.0292746052,-0.0134119168,-0.0305673201,0.0240902808,-0.00943951216,-0.0363037437,-0.0133984508,-0.0161589365,0.0144218504,0.0228648949,-0.012159599,-0.0149335498,-0.0104561783,-0.00441340962,0.00317960721,0.00941931363,-0.0280896164,-0.0130954711,0.0124289151,-0.00162010163,0.0209796857,-0.0206161104,0.0089278128,-0.0220973454,-0.0143949185,0.0155933732,0.035307277,0.0114189815,-0.0178690907,-0.0179498848,-0.00573305599,0.000917356287,0.0173304603,-0.0400202982,-0.00465916004,-0.0266353134,0.0359536335,0.00785728265,0.0256253798,-0.0142871924,0.0250867475,0.00967516284,-0.000598806422,-0.00641307794,-0.0120518729,-0.0254099276,-0.0172631312,-0.0133243892,-0.0132839922,0.0131089371,-0.0146238366,0.0153375231,0.0171823353,0.0139101511,-0.0116075026,-0.0116075026,-0.0300017577,-0.0166571699,-0.00573642226,0.00081972935,0.00404646713,-0.00479718437,-0.0248308983,0.0064871395,0.0174516514,0.0109880762,0.0146911656,-0.027389396,0.0134321153,0.00688101351,0.0101733971,-0.0176536385,-0.0039724051,-0.0192560665,0.0202660002,-0.0282512065,-0.0197139028,0.00820739288,0.00904900488,0.0310790204,0.0221781395,0.00242047408,0.0045413347,0.0031
1901141,-0.00632218365,-0.0170072801,-0.00729171978,-0.0148123577,0.00871909317,-0.0181653388,-0.0269315597,-0.0153240571,0.00106716307,0.0295169894,0.0167783629,0.0149739468,-0.0148662208,-0.0304057319,0.038323611,-0.022905292,0.033583656,-0.0209258217,0.0283858646,0.0102945892,0.00943277963,-0.0142602613,-0.0123817846,0.0141660003,-0.0141390692,0.0391584896,0.027429793,-0.0026594915,-0.00565226143,0.0129271485,-0.0277125761,-0.0160916075,-0.0377580486,-0.000467094244,0.00896147732,0.00249621901,-0.0122605925,0.00326040201,-0.0117219612,0.0296247154,-0.00252483389,-0.00585761433,-0.00253325002,-0.0119980099,-0.00985021796,0.0302710738,-0.0300286897,0.0153913861,-0.0291668791,-0.0280357543,-0.0114257149,-0.0236593764,0.00577345304,-0.00591147738,0.00736578181,0.0196869709,0.00640297821,0.00180609769,0.0231611412,0.00335802883,0.00370645593,-0.0154991131,-0.00287157763,0.0214509871,-0.00810640026,-0.0227841008,0.0332604796,0.0176267065,-0.0193233956,-0.0162397306,-0.0111496663,-0.0142871924,-0.0109274806,0.0113583859,-0.00748024089,0.00196937053,0.00628515286,0.0162935946,-0.0176401716,-0.0346609205,-0.0181249399,-0.00241879071,0.00449757045,-0.0162262656,-0.0264198612,0.0151086049,-0.00795154367,0.0128059564,-0.0226629078,-0.00614712853,0.0206969045,0.0127251623,-0.0325333253,-0.002859795,0.0235516503,-0.00716379471,-0.041151423,0.0125568397,-0.0201717392,-0.00598553941,0.0273355339,-0.0146911656,0.012974279,-0.0210604798,0.00546374032,-0.0106110349,-0.00470965682,-0.00842957851,0.00703587011,0.00194412202,0.033583656,-0.0284935907,-0.0292476732,0.0392662138,-0.00242720684,-0.00946644321,-2.69578595e-05,-0.00633228291,0.0117286947,0.00985695142,-0.00900187436,-0.00284127961,-0.0411783569,-0.00306178164,-0.0394278057,0.0339068361,-0.0208450276,0.012213463,-0.0217876323,0.0149335498,-0.0206026435,0.0233361963,0.00856423657,0.0313483365,0.0207507666,-0.00574988825,0.0257061739,0.0133445878,-0.00456826622,-0.0220569484,-0.00546037406,-0.00968862884,-0.0423364118,-0.0048
0055064,-0.00545364106,0.0288706329,0.013748561,-0.0224205237,-0.0194580518,-0.000234809544,-0.0494194143,0.00249621901,0.0204141233,0.0177075006,0.0257600378,0.0236593764,0.0179094877,0.0273355339,0.00528531894,-0.00549067184,-0.0507659912,-0.0121663325,-0.0159838814,0.000425013684,0.0306481142,-0.00795154367,-0.0396432579,-0.0111967959,-0.0096212998,-0.0174381863,0.0170746092,0.0206295755,0.013055074,-0.00627168687,0.000824779039,-0.00871909317,-0.00401953561,0.0279549584,0.0134119168,-0.0315907225,0.0023699773,0.0165629108,0.0301094837,0.0211547408,-0.00493184198,-0.0140582742,0.00331089855,0.0100252731,0.00296415482,0.00828818791,0.0102407262,0.0159030873,-0.0065578348,0.00384784653,0.00101077522,0.0485306717,-0.0125635732,-0.00631881738,0.00682041747,-0.0211682059,-0.0139505481,-0.000413862319,-0.00770915905,-0.0200101491,0.00935871713,-0.0432520844,-0.00511699636,-0.0163609236,0.00706280163,-0.00477025285,-0.000863493129,-0.0336375199,-0.00156455534,0.00502273627,-0.00950010773,0.00141306536,-0.00247433712,0.00654436927,-0.0227437019,-0.00875949021,0.00573978899,-0.00639624568,-0.0390238315,0.01528366,-0.00970882736,-0.0208988916,-0.0126174362,-0.00325703551,-0.0143275894,0.00577681977,0.192937702,0.00922405999,4.6025616e-05,0.0333143398,0.00849017501,-0.00724458974,0.00900187436,-0.0192425996,0.0172631312,0.0252483375,-0.0147450287,0.0180845428,-0.000300034415,0.0045413347,0.0282242745,-0.0233631283,-0.0378388427,-0.01225386,-0.00623465609,0.0308097042,-0.0127790254,-0.00998487603,-0.0215048511,-0.0133445878,0.0341222882,-0.0133311218,-0.0132839922,0.00800540671,0.0382428169,0.000427538529,0.00397577183,-0.0301364157,0.00798520818,0.0110419402,0.00242889021,-0.0104359798,0.000252693804,-0.0192829967,0.00901534036,-0.00608653249,0.0252752695,0.0116142351,0.0164686497,0.00590137811,0.0301902778,0.0251944754,-0.00424172077,0.00831511989,0.00297762058,-0.0142602613,-0.024319198,0.015243263,0.00439657737,0.0151355369,-0.00557483314,0.0132503277,0.0241306778,0.0167
110339,-0.0051001641,0.00082646223,-0.00303485012,0.0173843224,-0.0109409466,-0.0110284742,-0.00818719435,-0.00955397077,-0.0150008788,0.0274971221,0.000485188881,-0.0189463533,0.00873929169,-0.0107389595,-0.00882681925,-0.0149066187,-0.0201313421,-0.00852383953,0.0221781395,0.0231746081,-0.00399260409,0.00647367397,-0.00191887363,-0.0139909452,-0.0277664382,0.00724458974,-0.00960783474,-0.00880662072,0.0109274806,-0.0204410553,0.00521798991,-0.0200640131,-0.0089278128,-0.00712339766,-0.0187174343,-0.0151759339,-0.00143410556,-0.00496550649,-0.0125231752,0.0182057358,-0.0233227313,-0.0240229517,-0.019902423,0.0860732645,0.0420401655,0.000785223325,0.00729845278,-0.000281939778,0.00282949698,0.0166975688,0.0300556216,0.0066217971,0.012267326,-0.0330180936,0.00355833233,-0.0140717402,0.0106312335,-0.00381754851,0.00974922534,-0.0117017627,-0.00298772007,-0.0215183161,-0.000984685263,-0.010678364,0.00438311137,-0.0017842158,-0.0235381834,0.0145295765,0.0104561783,0.0124895107,-0.0131762661,-0.0218145642,0.0271066148,-0.0424980037,0.00134068669,0.00454470096,0.0207642335,-0.00491500972,0.0269988887,-0.0134523138,-0.00408686465,0.0116344336,0.00605960097,0.0211682059,0.0197946969,0.0258408319,0.0212355349,0.0128732855,-0.0100724036,0.00379398349,-0.00254334928,-0.0174112543,-0.000735147449,-0.00985021796,0.00831511989,0.00574315526,0.00188015949,-0.00799867325,-0.0158222914,-0.0158896204,0.0186231751,0.0180980098,-0.0438984446,0.00462549552,0.0403704084,-0.000457836519,-0.000183576456,-0.0116007701,-0.170099735,0.0394816697,0.012159599,-0.0215452481,0.030459594,-0.0162666626,0.00471638981,-0.00417102547,0.00754083693,-0.00251136813,0.00138445047,-0.00145262107,-0.0517355278,-0.00816699583,0.0181384068,0.00434608059,0.0155529762,0.0128126899,0.0432790183,0.0124558462,0.0285474528,-0.00853730459,0.0190944765,-0.0231072791,0.00926445704,0.0158357583,-0.0160646755,0.0276856441,-0.0109611452,-0.0276317801,0.0118768178,-0.0144891795,0.0363576077,0.00148207741,-0.00828145538,0.
0146777006,-0.00852383953,0.00023838639,-0.00380071648,0.0145969056,0.0150547419,0.0348225087,0.00350110279,0.0373002104,0.0108736176,0.0267699715,0.0190810114,-0.0329911634,0.00679011969,-0.004191224,0.0187174343,-0.0279010963,0.0228514299,-0.00574652152,-0.0125164427,0.00189025886,0.00423498778,0.0239152256,-0.0249520913,-0.0200640131,-0.00708973315,-0.0273489989,0.0100858696,-0.00455816649,-0.00465579377,-0.0230130181,0.00636258116,0.00447737193,-0.028978359,0.0127588268,-0.00040565661,0.00704933563,0.00861136708,0.0196735058,-0.0220838804,0.00685408199,0.0126847653,0.00573305599,0.0215721801,0.00766202854,0.00140885729,-0.00753410393,0.00659149932,0.0131426016,-0.00455143396,-0.00508669857,0.00786401611,0.0209123567,0.0208315626,0.018421188,0.044517871,-0.0464569405,-0.00865176413,0.00414746022,-0.000491080165,0.00147618609,0.00748697342,0.003827648,0.0175593775,0.00483421516,0.0155125782,0.0191483404,0.00242047408,-0.00928465556,0.0339068361,-0.00229423237,-0.000125715684,-0.0200370811,0.0524626784,0.00472985534,-1.71872798e-05,0.0303787999,0.0264737234,0.0124423811,-0.0058609806,0.0116546331,0.0076081655,-0.00861809961,0.0144622475,-0.00945297815,0.0388622433,0.0025181009,-0.00647367397,-0.0110150082,-0.00752063794,-0.033826042,-0.107079886,-0.0183403939,0.0257061739,0.0210739467,-0.0182057358,0.00343714026,-0.00380744925,0.035495799,-0.0296785794,0.0201044101,-0.0115132425,-0.00521125691,-0.00917692948,-0.00645347498,0.0277933702,0.00396230584,0.000925772358,-0.005726323,-0.00365932565,0.0312675424,0.0062043583,-0.000693487702,0.00190372462,-0.0124625796,-0.0118970163,-0.0178556256,-0.0363037437,0.00833531842,0.00509006483,0.00152584119,-0.00874602422,-0.0290322211,0.0131628001,-0.0255715158,-0.0105235074,0.0015653969,-0.045999106,0.0127116963,0.0224205237,-0.0347417146,0.0185423791,0.0146911656,0.00470965682,-0.0127924914,-0.0160781424,-0.0222993325,0.00180778094,-0.0138832191,0.0269180946,-0.0114728445,-0.0188790243,-0.0365461297,-0.00610673148,-0.007587966
97,0.0108803501,0.00925772451,0.0146911656,0.000181998432,-0.0043157828,0.0103888493,-0.0088537503,0.0108130211,-0.00652753701,0.0262044072,-0.00970882736,-0.00337486109,-0.00961456727,-0.0093385186,-0.0124423811,-0.0227167718,-0.0172092672,0.00614376226,-0.0349840969,-0.0146373026,0.00110756047,0.0312136784,-0.0376503207,-0.0305403881,0.000629104441,-0.0165359788,-0.0206026435,-0.0218818933,-0.0283050686,-0.0204410553,0.0316176526,0.0188520923,-0.00675645517,-0.0171554051,0.0210200828,-0.0273624659,-0.0206430405,0.00442350889,0.0145026455,-0.0189328864,0.00927118957,0.00793134514,-0.0108130211,-0.00768222753,0.0194176547,-0.015270194,-0.00993101299,0.0201986711,-0.0416361913,0.0208584946,0.00150900893,0.0074735079,-0.00687764725,0.00475005386,0.00308703003,-0.039616324,0.0147450287,0.0198485609,-0.0316984467,-0.00542334281,-0.0121461339,-0.00953377225,-0.0507929213,-0.0236189775,0.0146777006,-0.0025214674,-0.0103955828,0.0132570602,0.00386131229,0.0111900633,0.00805253722,0.0271604788,-0.00646694098,0.000301507243,-0.00674635591,0.00725805527,-0.0146507686,-0.0154317841,0.0131628001,-0.0318600386,-0.00986368395,0.0103417197,-0.0215048511,-0.022905292,-0.00516749313,0.0219088253,0.0329642296,0.0391046256,-0.0321562849,-0.0423094817,0.00414409395,-0.00870562717,-0.0223935917,-0.00432251533,-0.00302980049,-0.0131964646,-0.00859790109,-0.0375156626,0.0159838814,0.0199428201,-0.00565899396,-0.0181788038,-0.00492174271,0.00712339766,0.0180441458,0.00954723824,0.0108668851,-0.0140448082,0.036734648,0.0127453608,-0.0173035283,-0.0108062886,-0.019808162,-0.0294092633,-0.012173065,-0.00236156117,0.00440331036,0.00253156666,-0.0181518719,0.00387477828,0.00540987728,-0.00411379617,0.0161993336,0.00725132274,0.00533244899,-0.00283622998,-0.00667229388,0.0236997735,0.0124221826,-0.0136341024,-0.0156203043,0.01698035,0.0237267055,0.0159434844,0.00069475011,0.0193503257,0.00970882736,0.0105975689,-0.0133513212,0.0209123567,-0.022837963,-0.000100151738,-0.0200909451,0.00518769166,-
0.0172092672,0.011452646,-0.00541661028,0.0209258217,0.00915673096,-0.0132839922,-0.00632555038,-0.0281973425,-0.0205487814,0.0164147858,-0.0332874097,-0.0141121373,-0.0192560665,0.038269747,-0.0189463533,-0.00322000473,0.0111160018,0.00842284597,-0.00497897249,-0.0327757113,-0.0187039692,-0.0491770282,-0.00632891664,0.0182461329,0.00114879943,0.0321562849,0.00347417127,-0.0254368577,0.0173169933,0.0160377454,0.0126174362,-0.0343646705,0.00053610641,-0.0224205237,0.0133378552,-0.00334456307,0.00940584764,-0.0150547419,-0.015162468,-0.0142063983,-0.0300017577,0.0226359759,0.0225686468,0.042740386,0.0141256033,-0.0155664412,0.012933882,-0.0210604798,0.0114324475,0.0040498334,-0.00171267893,-0.00308871339,-0.0453527495,0.0408821106,-0.00651743775,0.00591147738,-0.0134657798,0.00962803327,0.0125299087,-3.76095022e-06,0.00311396155,0.000811734062,0.00443697488,0.0185962431,-0.00997141004,0.00545700733,0.000479718408,-0.00687764725,-0.0108601516,0.0122471265,0.000885375019,-0.0010015174,-0.0423902757,0.00789094716,-0.00157633785,-0.0104292473,0.00159990299,0.0102609247,-0.0210604798,0.00634238264,-0.0237805676,0.011493043,0.00284969574,0.00395557284,0.0121394005,-0.0116748316,-0.0242384039,-0.00463222852,0.0029372233,0.000373465009,-0.0133580538,-0.00799194071]"


In [52]:
query_text = "Will object-oriented databases be commercially successful?"

# embed_query is the embedder's entry point for a single search string. It
# returns one vector directly, so there is no one-element list to build and unwrap.
query_embedding = embedder.embed_query(query_text)

# Score every stored chunk by dot product against the query vector and keep
# only the highest-scoring one.
stmt = """
    SELECT
        content,
        DOT_PRODUCT_F32(JSON_ARRAY_PACK_F32(%s), vector) AS score
    FROM pdf_docs1
    ORDER BY score DESC
    LIMIT 1
"""

# Parameters are passed as a tuple, matching the insert cell.
results = db_connection.execute(stmt, (str(query_embedding),))

# Bind the winning row to `row` explicitly: the next cell builds its prompt
# from row[0], and relying on a leaked loop variable would leave `row`
# undefined (or stale from an earlier run) when the table is empty.
# first() also closes the result so the connection is released.
row = results.first()
if row is None:
    raise LookupError(
        "pdf_docs1 returned no rows; run the cell that inserts the embeddings first"
    )

print(row[0])

I N D U S T R Y T R E N D S

Whatever Happened to Object-Oriented Databases?

are gaining in popularity and are ex- pected to outsell even relational data- bases by 2003. And OO databases (see the “OO Database Orientation” sidebar) are still minor players with solid but strictly niche markets. Sales of relational databases have grown considerably faster than the sales of OO databases, and annual worldwide RDBMS revenues are now about 50 times larger.

Rick Cattell, distinguished engineer at Sun Microsystems, indicated, “Object- oriented databases are doing just ﬁne, and the news of their demise is highly exag- gerated. While their market [share] isn’t as big, they continue to be used in areas like CAD (computer-aided design) and telecommunications, where RDBMSs are not well suited.”

Neal Leavitt

A couple of years ago, industry

However, said Michael Stonebraker, chief technology ofﬁcer at Informix and an ORDBMS proponent and pioneer, “ODBMSs occupy a small niche market that has no br

In [53]:
import openai

# `row` is carried over from the retrieval cell above; its first column is the
# text of the best-matching chunk, which is handed to the model as context.
prompt = f"The user asked: {query_text}. The most similar text from the document is: {row[0]}"

system_message = {"role": "system", "content": "You are a helpful assistant."}
user_message = {"role": "user", "content": prompt}

# Legacy chat completion interface (openai.ChatCompletion).
response = openai.ChatCompletion.create(
    model="gpt-3.5-turbo",
    messages=[system_message, user_message],
)

# Only the first choice is used.
answer = response['choices'][0]['message']['content']
print(answer)

Based on the information provided in the document, it seems that object-oriented databases have not become commercially successful in the overall database marketplace, and remain a niche technology with limited market share. Sales of relational databases continue to outstrip that of object-oriented databases, although there are certain specialized industries where object-oriented databases are still used. While the industry initially touted them as being on the rise and well-suited for the Internet age, this trend has not materialized at the scale that some expected.
