Cerebrium

Verified Truly Free

Serverless GPU infrastructure for AI models. Deploy any model in minutes with automatic scaling. New users receive $30 in free compute credits.

$30 Credits · Serverless GPU · Custom Deploy · Auto-Scaling

Overview

Provider Type: Trial Credits

API Endpoint: https://api.cortex.cerebrium.ai/v4

Free Tier Highlights: Pay-per-second compute

Why Choose Cerebrium?

Cerebrium focuses on serverless GPU deployment: you write an ordinary Python app, deploy it with a single CLI command, and pay only for the seconds of compute you use while it auto-scales. With a developer-friendly API and comprehensive documentation, you can put a custom model behind an endpoint within minutes.

Quick Start Guide

1. Visit https://www.cerebrium.ai/
2. Sign up for a free account
3. Receive $30 in free credits
4. Install the Cerebrium CLI: pip install cerebrium
5. Deploy your model with cerebrium deploy
6. Access it via the generated API endpoint

Available Models

Model Name | ID | Context | Capabilities
Any HuggingFace Model | custom-deployment | Model-dependent | -
Llama 3.1 (Deployable) | meta-llama/Llama-3.1-8B-Instruct | 128,000 tokens | -

Integration Examples

Ready-to-use code snippets for your applications.

main.py
# Install the Cerebrium CLI/SDK: pip install cerebrium
# Cerebrium deployments are plain Python: this main.py is what gets deployed
from vllm import LLM, SamplingParams

# Load the model once at startup; it is reused across requests
llm = LLM(model="meta-llama/Llama-3.1-8B-Instruct")

def predict(prompt: str):
    # Each call runs one generation and returns the generated text
    params = SamplingParams(temperature=0.7, max_tokens=512)
    output = llm.generate([prompt], params)
    return {"response": output[0].outputs[0].text}

# Deploy: cerebrium deploy my-llm
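
Once deployed, the predict function above is reachable over HTTP. A minimal sketch of calling it with the requests library follows; the URL path (project ID, app name, function name) and the bearer token are placeholders, so use the actual values printed by cerebrium deploy or shown in the Cerebrium dashboard.

# call_endpoint.py -- client-side example (placeholders, not real values)
import requests

API_URL = "https://api.cortex.cerebrium.ai/v4/<project-id>/my-llm/predict"  # placeholder path
API_KEY = "<your-cerebrium-api-key>"  # placeholder token from the dashboard

response = requests.post(
    API_URL,
    headers={"Authorization": f"Bearer {API_KEY}"},
    json={"prompt": "Explain serverless GPUs in one sentence."},
    timeout=120,  # generous timeout to absorb a possible cold start
)
response.raise_for_status()
print(response.json()["response"])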

Free Tier Pricing & Limits

Limit | Scope | Free Tier
Rate Limit | Requests per minute | Pay-per-second compute
Daily Quota | Requests per day | Credit-based
Token Limit | Tokens per minute | $30 free credits
Monthly Quota | Per month | One-time $30 credit
Free Credits | One-time | $30
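
Because billing is pay-per-second rather than quota-based, a quick back-of-the-envelope calculation shows how far the $30 trial credit stretches. The per-second GPU rate, cold-start overhead, and per-request inference time below are hypothetical placeholders; check Cerebrium's pricing page for real rates.

# Rough estimate only -- all rates below are hypothetical placeholders
CREDIT_USD = 30.00
GPU_RATE_PER_SECOND = 0.0005    # hypothetical $/second for a mid-range GPU
COLD_START_OVERHEAD_S = 5       # hypothetical cold-start seconds per invocation
SECONDS_PER_REQUEST = 2         # hypothetical warm inference time per request

total_seconds = CREDIT_USD / GPU_RATE_PER_SECOND
requests_covered = total_seconds / (SECONDS_PER_REQUEST + COLD_START_OVERHEAD_S)

print(f"~{total_seconds:,.0f} GPU-seconds of compute")
print(f"~{requests_covered:,.0f} requests if every call pays a cold start")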

Use Cases

Custom model deployment

Fine-tuned model hosting

Testing GPU-intensive models

Scaling AI prototypes

Custom inference pipelines

Limitations & Considerations

The $30 is a one-time trial credit

Requires some DevOps knowledge

Cold starts for serverless models (see the timing sketch after this list)

GPU costs can vary significantly

Credit card required for continued use
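
To gauge how much the cold-start limitation matters for your workload, you can time a first (cold) request against an immediate follow-up. A minimal sketch, reusing the same placeholder endpoint and key as the integration example:

# Rough cold-start check -- URL and key are placeholders
import time
import requests

API_URL = "https://api.cortex.cerebrium.ai/v4/<project-id>/my-llm/predict"  # placeholder
API_KEY = "<your-cerebrium-api-key>"  # placeholder

def timed_call(prompt: str) -> float:
    start = time.perf_counter()
    resp = requests.post(
        API_URL,
        headers={"Authorization": f"Bearer {API_KEY}"},
        json={"prompt": prompt},
        timeout=300,  # first call may need minutes to start the container and load weights
    )
    resp.raise_for_status()
    return time.perf_counter() - start

cold = timed_call("warm-up request")    # typically includes cold-start overhead
warm = timed_call("follow-up request")  # closer to pure inference latency
print(f"cold: {cold:.1f}s  warm: {warm:.1f}s")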

