diff --git a/src/examples/notebooks/vectorize.ipynb b/src/examples/notebooks/vectorize.ipynb
index 45874b3..54cc857 100644
--- a/src/examples/notebooks/vectorize.ipynb
+++ b/src/examples/notebooks/vectorize.ipynb
@@ -192,9 +192,10 @@
  {
  "cell_type": "code",
  "source": [
- "import urllib3, json, os\n",
+ "import urllib3, json, os, mimetypes\n",
  "http = urllib3.PoolManager()\n",
  "file_path = \"apple.pdf\"\n",
+ "content_type = mimetypes.guess_type(file_path)[0] or \"application/octet-stream\"  # guess_type() yields None for unknown extensions\n",
  "\n",
  "uploads_api = v.UploadsApi(api)\n",
  "\n",
@@ -203,13 +204,13 @@
  "upload_response = uploads_api.start_file_upload_to_connector(\n",
  " org, source_connector_id, v.StartFileUploadToConnectorRequest(\n",
  " name=file_path.split(\"/\")[-1],\n",
- " content_type=\"application/pdf\",\n",
+ " content_type=content_type,\n",
  " # add additional metadata that will be stored along with each chunk in the vector database\n",
  " metadata=json.dumps(metadata))\n",
  ")\n",
  "\n",
  "with open(file_path, \"rb\") as f:\n",
- " response = http.request(\"PUT\", upload_response.upload_url, body=f, headers={\"Content-Type\": \"application/pdf\", \"Content-Length\": str(os.path.getsize(file_path))})\n",
+ " response = http.request(\"PUT\", upload_response.upload_url, body=f, headers={\"Content-Type\": content_type, \"Content-Length\": str(os.path.getsize(file_path))})\n",
  "if response.status != 200:\n",
  " print(\"Upload failed: \", response.data)\n",
  "else:\n",
@@ -547,12 +548,10 @@
  {
  "cell_type": "code",
  "source": [
- "from pathlib import Path\n",
  "import urllib3, os\n",
  "\n",
  "files_api = v.FilesApi(api)\n",
  "\n",
- "content_type=\"application/pdf\"\n",
  "file_path=\"apple.pdf\"\n",
  "\n",
  "start_file_upload_response = files_api.start_file_upload(org, start_file_upload_request=v.StartFileUploadRequest(\n",