Skip to content

Commit 44d135b

Browse files
Dan v2 updates (#1491)
1 parent 8089223 commit 44d135b

File tree

14 files changed

+383
-39
lines changed

14 files changed

+383
-39
lines changed

pgml-cms/docs/product/cloud-database/serverless.md

Lines changed: 6 additions & 31 deletions
Original file line numberDiff line numberDiff line change
@@ -19,39 +19,14 @@ Once logged in, select "New Database" from the left menu and choose the Serverle
1919
### Serverless Pricing
2020
Storage is charged per GB/mo, and all requests are charged by the CPU or GPU millisecond of compute required to perform them.
2121

22-
#### Vector & Relational Database
23-
| NAME | PRICING |
24-
| :--- | ---: |
25-
| Tables & Index Storage | $0.20 GB per month |
26-
| Retrieval, Filtering, Ranking & other Queries | $7.50 per hour |
27-
| Embeddings | Included w/ Queries |
28-
| LLMs | Included w/ Queries |
29-
| Fine Tuning | Included w/ Queries |
30-
| Machine Learning | Included w/ Queries |
31-
22+
<turbo-frame id="serverless-pricing-turboframe" src="/dashboard/serverless_pricing/turboframe?style=marketing">
23+
Loading our current pricing model...
24+
</turbo-frame>
3225

3326
### Serverless Models
3427

3528
Serverless AI engines come with predefined models and a flexible pricing structure.
3629

37-
#### Embedding Models
38-
| NAME | PARAMETERS (M) | MAX INPUT TOKENS | DIMENSIONS | STRENGTHS |
39-
| --- | --- | --- | --- | --- |
40-
| intfloat/e5-large-v2 | 33.4 | 512 | 384 | High quality, low latency |
41-
| mixedbread-ai/mxbai-embed-large-v1 | 334 | 512 | 1024 | High quality, higher latency |
42-
| Alibaba-NLP/gte-base-en-v1.5 | 137 | 8192 | 768 | Supports up to 8k input tokens, low latency |
43-
| Alibaba-NLP/gte-large-en-v1.5 | 434 | 8192 | 1024 | Supports up to 8k input tokens, higher latency |
44-
45-
#### Instruct Models
46-
| NAME | TOTAL PARAMETERS (M) | ACTIVE PARAMETERS (M) | CONTEXT SIZE | STRENGTHS |
47-
| --- | --- | --- | --- | --- |
48-
| meta-llama/Meta-Llama-3-70B-Instruct | 70,000 | 70,000 | 8,000 | High quality |
49-
| meta-llama/Meta-Llama-3-8B-Instruct | 8,000 | 8,000 | 8,000 | High quality, low latency |
50-
| microsoft/Phi-3-mini-128k-instruct | 3,820 | 3,820 | 128,000 | Lowest latency |
51-
| mistralai/Mixtral-8x7B-Instruct-v0.1 | 56,000 | 12,900 | 32,768 | MOE high quality |
52-
| mistralai/Mistral-7B-Instruct-v0.2 | 7,000 | 7,000 | 32,768 | High quality, low latency |
53-
54-
#### Summarization Models
55-
| NAME | PARAMETERS (M) | CONTEXT SIZE | STRENGTHS |
56-
| --- | --- | --- | --- |
57-
| google/pegasus-xsum | 568 | 512 | Efficient summarization |
30+
<turbo-frame id="serverless-models-turboframe" src="/dashboard/serverless_models/turboframe?style=marketing">
31+
Loading our current serverless models offered...
32+
</turbo-frame>

pgml-dashboard/Cargo.lock

Lines changed: 86 additions & 7 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

pgml-dashboard/src/components/tables/mod.rs

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -4,5 +4,13 @@
44
// src/components/tables/large
55
pub mod large;
66

7+
// src/components/tables/serverless_models
8+
pub mod serverless_models;
9+
pub use serverless_models::ServerlessModels;
10+
11+
// src/components/tables/serverless_pricing
12+
pub mod serverless_pricing;
13+
pub use serverless_pricing::ServerlessPricing;
14+
715
// src/components/tables/small
816
pub mod small;
Lines changed: 114 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,114 @@
1+
use crate::components::tables::small::row::Row;
2+
use pgml_components::component;
3+
use pgml_components::Component;
4+
use sailfish::TemplateOnce;
5+
6+
#[derive(TemplateOnce, Default)]
7+
#[template(path = "tables/serverless_models/template.html")]
8+
pub struct ServerlessModels {
9+
style_type: String,
10+
embedding_models: [Component; 4],
11+
instruct_models: [Component; 5],
12+
summarization_models: [Component; 1],
13+
}
14+
15+
impl ServerlessModels {
16+
pub fn new() -> ServerlessModels {
17+
ServerlessModels {
18+
style_type: "product".to_string(),
19+
embedding_models: [
20+
Component::from(Row::new(&[
21+
"intfloat/e5-small-v2".into(),
22+
"33.4".into(),
23+
"512".into(),
24+
"384".into(),
25+
"Good quality, low latency".into(),
26+
])),
27+
Component::from(Row::new(&[
28+
"mixedbread-ai/mxbai-embed-large-v1".into(),
29+
"335".into(),
30+
"512".into(),
31+
"1024".into(),
32+
"High quality, higher latency".into(),
33+
])),
34+
Component::from(Row::new(&[
35+
"Alibaba-NLP/gte-base-en-v1.5".into(),
36+
"137".into(),
37+
"8192".into(),
38+
"768".into(),
39+
"Supports up to 8,000 input tokens".into(),
40+
])),
41+
Component::from(Row::new(&[
42+
"Alibaba-NLP/gte-large-en-v1.5".into(),
43+
"434".into(),
44+
"8192".into(),
45+
"1024".into(),
46+
"Highest quality, 8,000 input tokens".into(),
47+
])),
48+
],
49+
instruct_models: [
50+
Component::from(Row::new(&[
51+
"meta-llama/Meta-Llama-3-70B-Instruct".into(),
52+
"70,000".into(),
53+
"70,000".into(),
54+
"8,000".into(),
55+
"Highest quality".into(),
56+
])),
57+
Component::from(Row::new(&[
58+
"meta-llama/Meta-Llama-3-8B-Instruct".into(),
59+
"8,000".into(),
60+
"8,000".into(),
61+
"8,000".into(),
62+
"High quality, low latency".into(),
63+
])),
64+
Component::from(Row::new(&[
65+
"microsoft/Phi-3-mini-128k-instruct".into(),
66+
"3,820".into(),
67+
"3,820".into(),
68+
"128,000".into(),
69+
"Lowest latency".into(),
70+
])),
71+
Component::from(Row::new(&[
72+
"mistralai/Mixtral-8x7B-Instruct-v0.1".into(),
73+
"56,000".into(),
74+
"12,900".into(),
75+
"32,768".into(),
76+
"MOE high quality".into(),
77+
])),
78+
Component::from(Row::new(&[
79+
"mistralai/Mistral-7B-Instruct-v0.2".into(),
80+
"7,000".into(),
81+
"7,000".into(),
82+
"32,768".into(),
83+
"High quality, low latency".into(),
84+
])),
85+
],
86+
summarization_models: [Component::from(Row::new(&[
87+
"google/pegasus-xsum".into(),
88+
"568".into(),
89+
"512".into(),
90+
"8,000".into(),
91+
]))],
92+
}
93+
}
94+
95+
pub fn set_style_type(mut self, style_type: &str) -> Self {
96+
self.style_type = style_type.to_string();
97+
self
98+
}
99+
}
100+
101+
#[derive(TemplateOnce, Default)]
102+
#[template(path = "tables/serverless_models/turbotemplate.html")]
103+
pub struct ServerlessModelsTurbo {
104+
comp: Component,
105+
}
106+
107+
impl ServerlessModelsTurbo {
108+
pub fn new(comp: Component) -> ServerlessModelsTurbo {
109+
ServerlessModelsTurbo { comp }
110+
}
111+
}
112+
113+
// Invoke the `component!` macro (imported from `pgml_components`) for both template structs.
// NOTE(review): presumably this generates their conversion into `Component` — confirm in pgml_components.
component!(ServerlessModels);
114+
component!(ServerlessModelsTurbo);
Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,7 @@
1+
// Header cells of the small tables inside the serverless-models controller:
// top-aligned, with 8px of padding above and below.
div[data-controller="tables-serverless-models"] {
  table.table.table-sm,
  table.table-sm {
    thead th {
      vertical-align: top;
      padding-top: 8px;
      padding-bottom: 8px;
    }
  }
}

0 commit comments

Comments
 (0)