diff --git a/api.md b/api.md
index d037762..ab66b5d 100644
--- a/api.md
+++ b/api.md
@@ -1,193 +1,824 @@
-# Replicate
+# Replicate Python SDK API Reference
-Types:
+## Installation
+
+```bash
+pip install replicate
+```
+
+## Quick start
```python
-from replicate.types import SearchResponse
+import replicate
+
+# Create a model function for image generation
+banana = replicate.use("google/nano-banana")
+
+# Call it - returns an image URL
+image_url = banana(prompt="astronaut on a horse")
+print(image_url) # https://replicate.delivery/...
+
+# Or for text generation
+claude = replicate.use("anthropic/claude-4-sonnet")
+text = claude(prompt="Write a haiku about Python")
+print(text) # "Code flows like water..."
```
-Methods:
+## Client initialization
-- replicate.search(\*\*params) -> SearchResponse
+By default, the SDK uses the `REPLICATE_API_TOKEN` environment variable:
-# Collections
+```python
+import replicate
+
+# Uses REPLICATE_API_TOKEN from environment
+image_url = replicate.run("google/nano-banana", input={"prompt": "hello"})
+```
-Types:
+### Custom client configuration
+
+For advanced use cases, you can create an explicit client instance:
```python
-from replicate.types import CollectionListResponse, CollectionGetResponse
+from replicate import Replicate
+import os
+
+# Explicitly specify which environment variable to use
+replicate = Replicate(
+ bearer_token=os.environ.get("MY_REPLICATE_TOKEN"),
+ base_url="https://api.replicate.com/v1", # Optional custom base URL
+ timeout=120.0, # Request timeout in seconds
+ max_retries=5 # Maximum number of retries
+)
+
+# Now use this configured client
+image_url = replicate.run("google/nano-banana", input={"prompt": "hello"})
```
-Methods:
+### Asynchronous client
-- replicate.collections.list() -> SyncCursorURLPage[CollectionListResponse]
-- replicate.collections.get(\*, collection_slug) -> CollectionGetResponse
+```python
+from replicate import AsyncReplicate
+import asyncio
+import os
+
+async def main():
+ # Can specify token explicitly if needed
+ replicate = AsyncReplicate(bearer_token=os.environ.get("MY_REPLICATE_TOKEN"))
+ image_url = await replicate.run(
+ "google/nano-banana",
+ input={"prompt": "a watercolor painting"}
+ )
+ print(image_url) # https://replicate.delivery/...
+
+asyncio.run(main())
+```
-# Deployments
+## High-level methods
-Types:
+### use() - Create a reusable model function (recommended)
+
+The most Pythonic way to interact with models: `use()` returns a callable function for any model that you can invoke repeatedly.
```python
-from replicate.types import (
- DeploymentCreateResponse,
- DeploymentUpdateResponse,
- DeploymentListResponse,
- DeploymentGetResponse,
+# Image generation - returns file URLs
+banana = replicate.use("google/nano-banana")
+
+# Simple call with just prompt (only required input)
+image_url = banana(prompt="a 19th century portrait of a wombat gentleman")
+print(image_url) # Returns: https://replicate.delivery/...
+
+# Use it multiple times
+image1 = banana(prompt="a cat in a hat")
+image2 = banana(prompt="a dog in sunglasses")
+
+# Text generation - returns text string
+claude = replicate.use("anthropic/claude-4-sonnet")
+
+# Simple call with just prompt (only required input)
+text = claude(prompt="Write a haiku about Python programming")
+print(text) # Returns: "Code flows like water..."
+
+# Enable streaming for text models
+claude_stream = replicate.use("anthropic/claude-4-sonnet", streaming=True)
+for chunk in claude_stream(prompt="Explain quantum computing"):
+ print(chunk, end="") # Streams text chunks
+
+# Can accept model references in various formats
+model = replicate.use("owner/name:version") # Specific version
+model = replicate.use("owner/name") # Latest version
+model = replicate.use("5c7d5dc6dd8bf75c1acaa8565735e7986bc5b66206b55cca93cb72c9bf15ccaa") # Version ID
+```
+
+### run() - Run a model once
+
+Runs a model directly and returns its output. Good for one-off predictions.
+
+```python
+# Image generation - returns a file URL
+image_url = replicate.run(
+ "google/nano-banana",
+ input={"prompt": "a 19th century portrait of a wombat gentleman"}
)
+print(image_url) # https://replicate.delivery/...
+
+# Text generation - returns text string
+text = replicate.run(
+ "anthropic/claude-4-sonnet",
+ input={"prompt": "Write a poem about machine learning"}
+)
+print(text) # "In silicon valleys deep and wide..."
+
+# Model reference formats
+replicate.run("owner/name:version", input={}) # Specific version
+replicate.run("owner/name", input={}) # Latest version
+replicate.run("5c7d5dc6dd8bf75c1acaa8565735e7986bc5b66206b55cca93cb72c9bf15ccaa", input={}) # Version ID
+```
+
+### stream() - Stream model output
+
+For models that support streaming (such as language models), returns an iterator of output chunks.
+
+```python
+# Stream text output (only for text models like Claude)
+for chunk in replicate.stream(
+ "anthropic/claude-4-sonnet",
+ input={"prompt": "Tell me a story about a robot"}
+):
+ print(chunk, end="") # Prints each text chunk as it arrives
+
+# Async streaming (inside an async function, using an AsyncReplicate client)
+async for chunk in async_replicate.stream(
+ "anthropic/claude-4-sonnet",
+ input={"prompt": "Hello"}
+):
+ print(chunk, end="")
+```
+
+### search() - Search models
+
+Find models by keyword or description.
+
+```python
+# Search for models
+results = replicate.search(query="image generation", limit=10)
+
+for model in results:
+ print(f"{model.owner}/{model.name}: {model.description}")
```
-Methods:
+## Core resources
+
+### Predictions
-- replicate.deployments.create(\*\*params) -> DeploymentCreateResponse
-- replicate.deployments.update(\*, deployment_owner, deployment_name, \*\*params) -> DeploymentUpdateResponse
-- replicate.deployments.list() -> SyncCursorURLPage[DeploymentListResponse]
-- replicate.deployments.delete(\*, deployment_owner, deployment_name) -> None
-- replicate.deployments.get(\*, deployment_owner, deployment_name) -> DeploymentGetResponse
+Create and manage model predictions.
-## Predictions
+```python
+from replicate.types import Prediction
+
+# Create a prediction
+prediction = replicate.predictions.create(
+ model="owner/model:version",
+ input={"prompt": "hello world"},
+ webhook="https://example.com/webhook", # Optional webhook URL
+ webhook_events_filter=["start", "completed"] # Optional webhook events
+)
+
+# Get prediction status
+prediction = replicate.predictions.get(prediction_id="abc123")
+print(f"Status: {prediction.status}")
+print(f"Output: {prediction.output}")
-Methods:
+# Cancel a prediction
+cancelled = replicate.predictions.cancel(prediction_id="abc123")
-- replicate.deployments.predictions.create(\*, deployment_owner, deployment_name, \*\*params) -> Prediction
+# List predictions
+for prediction in replicate.predictions.list():
+ print(f"{prediction.id}: {prediction.status}")
+
+# Wait for a prediction to complete
+completed = replicate.predictions.wait(
+ prediction_id="abc123",
+ timeout=60 # Optional timeout in seconds
+)
+```
-# Hardware
+### Models
-Types:
+Interact with models and their versions.
```python
-from replicate.types import HardwareListResponse
+# Get a specific model
+model = replicate.models.get(model_owner="google", model_name="nano-banana")
+print(f"Model: {model.owner}/{model.name}")
+print(f"Description: {model.description}")
+print(f"Latest version: {model.latest_version.id}")
+
+# List all models (with pagination)
+for model in replicate.models.list():
+ print(f"{model.owner}/{model.name}")
+
+# Search models
+for model in replicate.models.search(query="text generation"):
+ print(f"{model.owner}/{model.name}: {model.description}")
+
+# Create a new model
+model = replicate.models.create(
+ owner="your-username",
+ name="my-model",
+ visibility="public", # or "private"
+ hardware="gpu-t4", # Specify hardware requirements
+ description="My custom model",
+ github_url="https://github.com/user/repo"
+)
+
+# Delete a model
+replicate.models.delete(model_owner="your-username", model_name="my-model")
```
-Methods:
+#### Model versions
-- replicate.hardware.list() -> HardwareListResponse
+```python
+# List model versions
+for version in replicate.models.versions.list(
+ model_owner="google",
+ model_name="nano-banana"
+):
+ print(f"Version {version.id}: created at {version.created_at}")
+
+# Get a specific version
+version = replicate.models.versions.get(
+ model_owner="google",
+ model_name="nano-banana",
+ version_id="db21e45d3f7023abc2a46ee38a23973f6dce16bb082a930b0c49861f96d1e5bf"
+)
-# Account
+# Delete a version
+replicate.models.versions.delete(
+ model_owner="your-username",
+ model_name="my-model",
+ version_id="version-id"
+)
+```
+
+#### Model predictions
-Types:
+Run predictions directly through a model.
```python
-from replicate.types import AccountGetResponse
+# Create a prediction for a specific model
+prediction = replicate.models.predictions.create(
+ model_owner="google",
+ model_name="nano-banana",
+ input={"prompt": "a beautiful landscape"}
+)
+# prediction.output will be an image URL when complete
```
-Methods:
+#### Model examples
-- replicate.account.get() -> AccountGetResponse
+```python
+# Get example predictions for a model
+for example in replicate.models.examples.list(
+ model_owner="google",
+ model_name="nano-banana"
+):
+ print(f"Example input: {example.input}")
+ print(f"Example output: {example.output}")
+```
-# Models
+### Deployments
-Types:
+Manage model deployments for production use.
```python
-from replicate.types import (
- ModelCreateResponse,
- ModelListResponse,
- ModelGetResponse,
- ModelSearchResponse,
+# Create a deployment
+deployment = replicate.deployments.create(
+ name="my-deployment",
+ model="owner/model:version",
+ hardware="gpu-a100-large",
+ min_instances=1,
+ max_instances=10
+)
+
+# List deployments
+for deployment in replicate.deployments.list():
+ print(f"{deployment.owner}/{deployment.name}")
+
+# Get deployment details
+deployment = replicate.deployments.get(
+ deployment_owner="your-username",
+ deployment_name="my-deployment"
+)
+
+# Update deployment
+updated = replicate.deployments.update(
+ deployment_owner="your-username",
+ deployment_name="my-deployment",
+ min_instances=2,
+ max_instances=20
)
+
+# Delete deployment
+replicate.deployments.delete(
+ deployment_owner="your-username",
+ deployment_name="my-deployment"
+)
+
+# Run a prediction on a deployment
+prediction = replicate.deployments.predictions.create(
+ deployment_owner="your-username",
+ deployment_name="my-deployment",
+ input={"prompt": "hello world"}
+)
+```
+
+### Trainings
+
+Create and manage model training jobs.
+
+```python
+# Start a training job
+training = replicate.trainings.create(
+ model_owner="your-username",
+ model_name="my-model",
+ version_id="base-version-id",
+ input={
+ "train_data": "https://example.com/training-data.zip",
+ "epochs": 100,
+ "batch_size": 32
+ },
+ webhook="https://example.com/training-webhook"
+)
+
+# Get training status
+training = replicate.trainings.get(training_id="training-abc123")
+print(f"Status: {training.status}")
+
+# List trainings
+for training in replicate.trainings.list():
+ print(f"{training.id}: {training.status}")
+
+# Cancel a training
+cancelled = replicate.trainings.cancel(training_id="training-abc123")
+```
+
+### Collections
+
+Browse curated model collections.
+
+```python
+# List collections
+for collection in replicate.collections.list():
+ print(f"{collection.name}: {collection.description}")
+
+# Get a specific collection
+collection = replicate.collections.get(collection_slug="awesome-banana-models")
+for model in collection.models:
+ print(f"- {model.owner}/{model.name}")
+```
+
+### Files
+
+Upload and manage files for model inputs.
+
+```python
+# Create/upload a file
+with open("image.jpg", "rb") as f:
+ file_response = replicate.files.create(file=f)
+ file_url = file_response.urls.get
+
+# List files
+for file in replicate.files.list():
+ print(f"{file.id}: {file.name}")
+
+# Get file details
+file = replicate.files.get(file_id="file-abc123")
+print(f"File URL: {file.urls.get}")
+
+# Delete a file
+replicate.files.delete(file_id="file-abc123")
```
-Methods:
+### Hardware
-- replicate.models.create(\*\*params) -> ModelCreateResponse
-- replicate.models.list() -> SyncCursorURLPage[ModelListResponse]
-- replicate.models.delete(\*, model_owner, model_name) -> None
-- replicate.models.get(\*, model_owner, model_name) -> ModelGetResponse
-- replicate.models.search(\*\*params) -> SyncCursorURLPage[ModelSearchResponse]
+Get information about available hardware.
-## Examples
+```python
+# List available hardware SKUs
+hardware_list = replicate.hardware.list()
+for sku in hardware_list:
+ print(f"{sku.name}: {sku.specs}")
+```
-Methods:
+### Account
-- replicate.models.examples.list(\*, model_owner, model_name) -> SyncCursorURLPage[Prediction]
+Manage account information.
-## Predictions
+```python
+# Get account details
+account = replicate.account.get()
+print(f"Username: {account.username}")
+print(f"Email: {account.email}")
+```
-Methods:
+### Webhooks
-- replicate.models.predictions.create(\*, model_owner, model_name, \*\*params) -> Prediction
+Configure webhooks for predictions.
-## Readme
+```python
+# Get the default webhook secret
+webhook_secret = replicate.webhooks.default.secret.get()
+print(f"Webhook signing secret: {webhook_secret.key}")
+```
+
+## File handling
+
+### Input files
-Types:
+The SDK supports multiple ways to provide file inputs:
```python
-from replicate.types.models import ReadmeGetResponse
+# For models that accept image inputs (like Claude with vision)
+with open("input.jpg", "rb") as f:
+ text = replicate.run("anthropic/claude-4-sonnet", input={
+ "prompt": "What's in this image?",
+ "image": f
+ })
+
+# File path (automatically opened)
+text = replicate.run("anthropic/claude-4-sonnet", input={
+ "prompt": "Describe this",
+ "image": "path/to/image.jpg"
+})
+
+# URL
+text = replicate.run("anthropic/claude-4-sonnet", input={
+ "prompt": "Analyze this image",
+ "image": "https://example.com/image.jpg"
+})
```
-Methods:
+### Output files
-- replicate.models.readme.get(\*, model_owner, model_name) -> str
+File outputs are automatically converted to `FileOutput` objects:
+
+```python
+from replicate.helpers import FileOutput
+
+# Image generation returns a file URL
+image_url = replicate.run("google/nano-banana", input={"prompt": "sunset over mountains"})
+print(f"Generated image: {image_url}")
+
+# Text generation returns a string
+text = replicate.run("anthropic/claude-4-sonnet", input={"prompt": "Tell me a joke"})
+print(f"Response: {text}")
+
+# FileOutput objects expose the URL and can be streamed to disk
+if isinstance(image_url, FileOutput):
+ # Get the URL
+ print(f"File URL: {image_url.url}")
+
+ # Save to disk
+ with open("output.jpg", "wb") as f:
+ for chunk in image_url:
+ f.write(chunk)
+```
-## Versions
+## Error handling
-Types:
+The SDK provides detailed exception types for error handling:
```python
-from replicate.types.models import VersionListResponse, VersionGetResponse
+from replicate.exceptions import (
+ ReplicateError,
+ ModelError,
+ RateLimitError,
+ AuthenticationError,
+ NotFoundError
+)
+
+try:
+ image_url = replicate.run("google/nano-banana", input={"prompt": "test"})
+except ModelError as e:
+ # Model execution failed
+ print(f"Model error: {e}")
+ print(f"Prediction ID: {e.prediction.id}")
+ print(f"Prediction status: {e.prediction.status}")
+except RateLimitError as e:
+ # Rate limited
+ print("Rate limit exceeded, retry after:", e.response.headers.get("retry-after"))
+except AuthenticationError:
+ # Invalid API token
+ print("Invalid API token")
+except NotFoundError:
+ # Model not found
+ print("Model not found")
+except ReplicateError as e:
+ # Other Replicate API errors
+ print(f"API error: {e}")
```
-Methods:
+## Pagination
-- replicate.models.versions.list(\*, model_owner, model_name) -> SyncCursorURLPage[VersionListResponse]
-- replicate.models.versions.delete(\*, model_owner, model_name, version_id) -> None
-- replicate.models.versions.get(\*, model_owner, model_name, version_id) -> VersionGetResponse
+The SDK automatically handles pagination for list operations:
+
+```python
+# Automatic pagination (iterates through all pages)
+for model in replicate.models.list():
+ print(model.name)
-# Predictions
+# Manual pagination
+first_page = replicate.models.list()
+print(f"Items in first page: {len(first_page.items)}")
-Types:
+if first_page.has_next_page():
+ next_page = first_page.get_next_page()
+ print(f"Items in second page: {len(next_page.items)}")
+
+# Get all items at once
+all_models = list(replicate.models.list())
+```
+
+## Advanced features
+
+### Raw response access
+
+Access the underlying HTTP response:
+
+```python
+# Get raw response
+response = replicate.predictions.with_raw_response.create(
+ model="model:version",
+ input={"prompt": "test"}
+)
+
+# Access response data
+print(f"Status code: {response.status_code}")
+print(f"Headers: {response.headers}")
+
+# Parse the response
+prediction = response.parse()
+```
+
+### Custom HTTP client
+
+Configure a custom HTTP client for Replicate:
```python
-from replicate.types import Prediction, PredictionOutput, PredictionRequest
+import httpx
+from replicate import Replicate, DefaultHttpxClient
+
+# With proxy
+replicate = Replicate(
+ http_client=DefaultHttpxClient(
+ proxy="http://proxy.example.com:8080"
+ )
+)
+
+# With custom timeout
+replicate = Replicate(
+ http_client=DefaultHttpxClient(
+ timeout=httpx.Timeout(60.0)
+ )
+)
```
-Methods:
+### Retries and timeouts
+
+Configure retry behavior and timeouts:
+
+```python
+replicate = Replicate(
+ max_retries=5, # Maximum number of retries
+ timeout=120.0 # Request timeout in seconds
+)
-- replicate.predictions.create(\*\*params) -> Prediction
-- replicate.predictions.list(\*\*params) -> SyncCursorURLPageWithCreatedFilters[Prediction]
-- replicate.predictions.cancel(\*, prediction_id) -> Prediction
-- replicate.predictions.get(\*, prediction_id) -> Prediction
+# Per-request wait: block up to 60 seconds for this call
+image_url = replicate.run(
+ "google/nano-banana",
+ input={"prompt": "test"},
+ wait=60 # Wait up to 60 seconds for completion
+)
+```
-# Trainings
+### Client copying
-Types:
+Create a new Replicate instance with modified settings:
```python
-from replicate.types import (
- TrainingCreateResponse,
- TrainingListResponse,
- TrainingCancelResponse,
- TrainingGetResponse,
+# Create a copy with different settings
+new_replicate = replicate.copy(
+ bearer_token="different_token",
+ timeout=60.0,
+ max_retries=3
)
```
-Methods:
+## Async/await support
+
+All methods have async equivalents when using `AsyncReplicate`:
+
+```python
+import asyncio
+from replicate import AsyncReplicate
+
+async def main():
+ replicate = AsyncReplicate()
+
+ # Image generation
+ image_url = await replicate.run(
+ "google/nano-banana",
+ input={"prompt": "a futuristic city"}
+ )
+ print(f"Image: {image_url}")
+
+ # Stream text generation
+ async for chunk in replicate.stream(
+ "anthropic/claude-4-sonnet",
+ input={"prompt": "Tell me a joke"}
+ ):
+ print(chunk, end="")
+
+ # Pagination
+ async for model in replicate.models.list():
+ print(model.name)
+
+ # Concurrent requests
+ tasks = [
+ replicate.run("google/nano-banana", input={"prompt": "cat"}),
+ replicate.run("google/nano-banana", input={"prompt": "dog"}),
+ replicate.run("anthropic/claude-4-sonnet", input={"prompt": "Hello"})
+ ]
+ results = await asyncio.gather(*tasks)
+
+asyncio.run(main())
+```
-- replicate.trainings.create(\*, model_owner, model_name, version_id, \*\*params) -> TrainingCreateResponse
-- replicate.trainings.list() -> SyncCursorURLPage[TrainingListResponse]
-- replicate.trainings.cancel(\*, training_id) -> TrainingCancelResponse
-- replicate.trainings.get(\*, training_id) -> TrainingGetResponse
+## Environment variables
-# Webhooks
+The SDK respects these environment variables (a short usage sketch follows the list):
-## Default
+- `REPLICATE_API_TOKEN` - API authentication token
+- `REPLICATE_BASE_URL` - Override the API base URL (default: `https://api.replicate.com/v1`)
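+
+A minimal sketch (the token value is a placeholder): these variables are normally exported in your shell before Python starts; setting them via `os.environ` here is for illustration only.
+
+```python
+import os
+
+# Placeholder value; in practice, export this in your shell before running Python.
+os.environ["REPLICATE_API_TOKEN"] = "r8_your_token_here"
+# Optional override; defaults to the public API endpoint.
+os.environ["REPLICATE_BASE_URL"] = "https://api.replicate.com/v1"
+
+import replicate
+
+# The client picks up both variables when it is constructed.
+image_url = replicate.run("google/nano-banana", input={"prompt": "hello"})
+```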
-### Secret
+## Type hints
-Types:
+The SDK is fully typed with comprehensive type hints:
```python
-from replicate.types.webhooks.default import SecretGetResponse
+import replicate
+from replicate.types import Prediction, PredictionStatus
+from replicate.pagination import SyncCursorURLPage
+
+# Type hints for responses
+prediction: Prediction = replicate.predictions.get(prediction_id="abc123")
+status: PredictionStatus = prediction.status
+
+# Type hints for pagination
+page: SyncCursorURLPage[Prediction] = replicate.predictions.list()
```
-Methods:
+## Common patterns
-- replicate.webhooks.default.secret.get() -> SecretGetResponse
+### Wait for completion with polling
-# Files
+```python
+import time
+
+def wait_for_prediction(replicate, prediction_id, timeout=300):
+ """Poll a prediction until it completes or times out."""
+ start = time.time()
+ while time.time() - start < timeout:
+        prediction = replicate.predictions.get(prediction_id=prediction_id)
+ if prediction.status in ["succeeded", "failed", "canceled"]:
+ return prediction
+ time.sleep(2) # Poll every 2 seconds
+ raise TimeoutError(f"Prediction {prediction_id} timed out")
+
+# Usage
+prediction = replicate.predictions.create(model="model:version", input={})
+result = wait_for_prediction(replicate, prediction.id)
+```
-Types:
+### Batch processing
```python
-from replicate.types import FileCreateResponse, FileListResponse, FileGetResponse
+import asyncio
+from replicate import AsyncReplicate
+
+async def batch_process(prompts):
+ """Process multiple prompts in parallel."""
+    replicate = AsyncReplicate()
+ tasks = [
+ replicate.run("model:version", input={"prompt": prompt})
+ for prompt in prompts
+ ]
+ return await asyncio.gather(*tasks)
+
+# Usage
+prompts = ["prompt 1", "prompt 2", "prompt 3"]
+results = asyncio.run(batch_process(prompts))
```
+
+### Webhook handling
+
+```python
+from flask import Flask, request
+import hmac
+import hashlib
+
+app = Flask(__name__)
+
+def verify_webhook(payload, signature, secret):
+    """Verify a webhook signature (simplified illustration; see Replicate's webhook docs for the exact header names and signing scheme)."""
+ expected = hmac.new(
+ secret.encode(),
+ payload,
+ hashlib.sha256
+ ).hexdigest()
+ return hmac.compare_digest(expected, signature)
+
+@app.route("/webhook", methods=["POST"])
+def webhook():
+ # Get webhook secret
+ secret = "your_webhook_secret" # From replicate.webhooks.default.secret.get()
+
+ # Verify signature
+ signature = request.headers.get("X-Replicate-Signature")
+ if not verify_webhook(request.data, signature, secret):
+ return "Unauthorized", 401
+
+ # Process prediction
+ data = request.json
+ print(f"Prediction {data['id']} status: {data['status']}")
+
+ if data["status"] == "succeeded":
+ print(f"Output: {data['output']}")
+
+ return "OK", 200
+```
+
+## Migration guide
+
+### From v0.x to v1.0+
+
+The new SDK keeps `run()` unchanged, but resource methods such as `models.get()` now take keyword arguments. Here's how to migrate:
+
+**Old (v0.x):**
+```python
+import replicate
+
+# Run a model - image generation returns URL
+image_url = replicate.run(
+ "google/nano-banana",
+ input={"prompt": "a cat"}
+)
+
+# Get a model
+model = replicate.models.get("google/nano-banana")
+```
+
+**New (v1.0+):**
+```python
+import replicate
+
+# Run a model - image generation returns URL
+image_url = replicate.run(
+ "google/nano-banana",
+ input={"prompt": "a cat"}
+)
+
+# Get a model
+model = replicate.models.get(
+ model_owner="google",
+ model_name="nano-banana"
+)
+```
+
+### Using legacy authentication
+
+For compatibility with older code:
+
+```python
+from replicate import Replicate
+
+# Old style (still supported)
+replicate = Replicate(api_token="your_token")
+
+# New style (recommended)
+replicate = Replicate(bearer_token="your_token")
+```
+
+## Support
+
+- **Documentation**: https://replicate.com/docs
+- **GitHub**: https://github.com/replicate/replicate-python
+- **Discord**: https://discord.gg/replicate
+- **API Reference**: https://replicate.com/docs/api
+
+## License
+
+Apache License 2.0
\ No newline at end of file
diff --git a/src/replicate/_client.py b/src/replicate/_client.py
index 390a552..237cd87 100644
--- a/src/replicate/_client.py
+++ b/src/replicate/_client.py
@@ -102,6 +102,7 @@ def __init__(
self,
*,
bearer_token: str | None = None,
+ api_token: str | None = None, # Legacy compatibility parameter
base_url: str | httpx.URL | None = None,
timeout: Union[float, Timeout, None, NotGiven] = NOT_GIVEN,
max_retries: int = DEFAULT_MAX_RETRIES,
@@ -124,7 +125,17 @@ def __init__(
"""Construct a new synchronous Replicate client instance.
This automatically infers the `bearer_token` argument from the `REPLICATE_API_TOKEN` environment variable if it is not provided.
+
+ For legacy compatibility, you can also pass `api_token` instead of `bearer_token`.
"""
+ # Handle legacy api_token parameter
+ if api_token is not None and bearer_token is not None:
+ raise ReplicateError(
+ "Cannot specify both 'bearer_token' and 'api_token'. Please use 'bearer_token' (recommended) or 'api_token' for legacy compatibility."
+ )
+ if api_token is not None:
+ bearer_token = api_token
+
if bearer_token is None:
bearer_token = _get_api_token_from_environment()
if bearer_token is None:
@@ -477,6 +488,7 @@ def __init__(
self,
*,
bearer_token: str | None = None,
+ api_token: str | None = None, # Legacy compatibility parameter
base_url: str | httpx.URL | None = None,
timeout: Union[float, Timeout, None, NotGiven] = NOT_GIVEN,
max_retries: int = DEFAULT_MAX_RETRIES,
@@ -499,7 +511,17 @@ def __init__(
"""Construct a new async AsyncReplicate client instance.
This automatically infers the `bearer_token` argument from the `REPLICATE_API_TOKEN` environment variable if it is not provided.
+
+ For legacy compatibility, you can also pass `api_token` instead of `bearer_token`.
"""
+ # Handle legacy api_token parameter
+ if api_token is not None and bearer_token is not None:
+ raise ReplicateError(
+ "Cannot specify both 'bearer_token' and 'api_token'. Please use 'bearer_token' (recommended) or 'api_token' for legacy compatibility."
+ )
+ if api_token is not None:
+ bearer_token = api_token
+
if bearer_token is None:
bearer_token = _get_api_token_from_environment()
if bearer_token is None:
diff --git a/tests/test_api_token_compatibility.py b/tests/test_api_token_compatibility.py
new file mode 100644
index 0000000..3d2ef51
--- /dev/null
+++ b/tests/test_api_token_compatibility.py
@@ -0,0 +1,89 @@
+"""Tests for api_token legacy compatibility during client instantiation."""
+
+from __future__ import annotations
+
+import pytest
+
+from replicate import Replicate, AsyncReplicate, ReplicateError
+from replicate._client import Client
+
+
+class TestApiTokenCompatibility:
+ """Test that api_token parameter works as a legacy compatibility option."""
+
+ def test_sync_client_with_api_token(self) -> None:
+ """Test that Replicate accepts api_token parameter."""
+ client = Replicate(api_token="test_token_123")
+ assert client.bearer_token == "test_token_123"
+
+ def test_async_client_with_api_token(self) -> None:
+ """Test that AsyncReplicate accepts api_token parameter."""
+ client = AsyncReplicate(api_token="test_token_123")
+ assert client.bearer_token == "test_token_123"
+
+ def test_sync_client_with_bearer_token(self) -> None:
+ """Test that Replicate still accepts bearer_token parameter."""
+ client = Replicate(bearer_token="test_token_123")
+ assert client.bearer_token == "test_token_123"
+
+ def test_async_client_with_bearer_token(self) -> None:
+ """Test that AsyncReplicate still accepts bearer_token parameter."""
+ client = AsyncReplicate(bearer_token="test_token_123")
+ assert client.bearer_token == "test_token_123"
+
+ def test_sync_client_both_tokens_error(self) -> None:
+ """Test that providing both api_token and bearer_token raises an error."""
+ with pytest.raises(ReplicateError, match="Cannot specify both 'bearer_token' and 'api_token'"):
+ Replicate(api_token="test_api", bearer_token="test_bearer")
+
+ def test_async_client_both_tokens_error(self) -> None:
+ """Test that providing both api_token and bearer_token raises an error."""
+ with pytest.raises(ReplicateError, match="Cannot specify both 'bearer_token' and 'api_token'"):
+ AsyncReplicate(api_token="test_api", bearer_token="test_bearer")
+
+ def test_sync_client_no_token_with_env(self, monkeypatch: pytest.MonkeyPatch) -> None:
+ """Test that client reads from environment when no token is provided."""
+ monkeypatch.setenv("REPLICATE_API_TOKEN", "env_token_123")
+ client = Replicate()
+ assert client.bearer_token == "env_token_123"
+
+ def test_async_client_no_token_with_env(self, monkeypatch: pytest.MonkeyPatch) -> None:
+ """Test that async client reads from environment when no token is provided."""
+ monkeypatch.setenv("REPLICATE_API_TOKEN", "env_token_123")
+ client = AsyncReplicate()
+ assert client.bearer_token == "env_token_123"
+
+ def test_sync_client_no_token_no_env(self, monkeypatch: pytest.MonkeyPatch) -> None:
+ """Test that client raises error when no token is provided and env is not set."""
+ monkeypatch.delenv("REPLICATE_API_TOKEN", raising=False)
+ with pytest.raises(ReplicateError, match="The bearer_token client option must be set"):
+ Replicate()
+
+ def test_async_client_no_token_no_env(self, monkeypatch: pytest.MonkeyPatch) -> None:
+ """Test that async client raises error when no token is provided and env is not set."""
+ monkeypatch.delenv("REPLICATE_API_TOKEN", raising=False)
+ with pytest.raises(ReplicateError, match="The bearer_token client option must be set"):
+ AsyncReplicate()
+
+ def test_legacy_client_alias(self) -> None:
+ """Test that legacy Client import still works as an alias."""
+ assert Client is Replicate
+
+ def test_legacy_client_with_api_token(self) -> None:
+ """Test that legacy Client alias works with api_token parameter."""
+ client = Client(api_token="test_token_123")
+ assert client.bearer_token == "test_token_123"
+ assert isinstance(client, Replicate)
+
+ def test_api_token_overrides_env(self, monkeypatch: pytest.MonkeyPatch) -> None:
+ """Test that explicit api_token overrides environment variable."""
+ monkeypatch.setenv("REPLICATE_API_TOKEN", "env_token")
+ client = Replicate(api_token="explicit_token")
+ assert client.bearer_token == "explicit_token"
+
+ def test_bearer_token_overrides_env(self, monkeypatch: pytest.MonkeyPatch) -> None:
+ """Test that explicit bearer_token overrides environment variable."""
+ monkeypatch.setenv("REPLICATE_API_TOKEN", "env_token")
+ client = Replicate(bearer_token="explicit_token")
+ assert client.bearer_token == "explicit_token"
\ No newline at end of file