Movatterモバイル変換


[0]ホーム

URL:


Skip to content

Navigation Menu

Sign in
Appearance settings

Search code, repositories, users, issues, pull requests...

Provide feedback

We read every piece of feedback, and take your input very seriously.

Saved searches

Use saved searches to filter your results more quickly

Sign up
Appearance settings

Commit 44d135b

Browse files
Dan v2 updates (#1491)
1 parent 8089223 commit 44d135b

File tree

14 files changed

+383
-39
lines changed

14 files changed

+383
-39
lines changed

‎pgml-cms/docs/product/cloud-database/serverless.md

Lines changed: 6 additions & 31 deletions
Original file line numberDiff line numberDiff line change
@@ -19,39 +19,14 @@ Once logged in, select "New Database" from the left menu and choose the Serverle
1919
### Serverless Pricing
2020
Storage is charged per GB/mo, and all requests by CPU or GPU millisecond of compute required to perform them.
2121

22-
#### Vector & Relational Database
23-
| NAME| PRICING|
24-
| :---| ---:|
25-
| Tables & Index Storage| $0.20 GB per month|
26-
| Retrieval, Filtering, Ranking & other Queries| $7.50 per hour|
27-
| Embeddings| Included w/ Queries|
28-
| LLMs| Included w/ Queries|
29-
| Fine Tuning| Included w/ Queries|
30-
| Machine Learning| Included w/ Queries|
31-
22+
<turbo-frame id="serverless-pricing-turboframe" src="/dashboard/serverless_pricing/turboframe?style=marketing">
23+
Loading our current pricing model...
24+
</turbo-frame>
3225

3326
### Serverless Models
3427

3528
Serverless AI engines come with predefined models and a flexible pricing structure
3629

37-
#### Embedding Models
38-
| NAME| PARAMETERS (M)| MAX INPUT TOKENS| DIMENSIONS| STRENGTHS|
39-
| ---| ---| ---| ---| ---|
40-
| intfloat/e5-large-v2| 33.4| 512| 384| High quality, low latency|
41-
| mixedbread-ai/mxbai-embed-large-v1| 334| 512| 1024| High quality, higher latency|
42-
| Alibaba-NLP/gte-base-en-v1.5| 137| 8192| 768| Supports up to 8k input tokens, low latency|
43-
| Alibaba-NLP/gte-large-en-v1.5| 434| 8192| 1024| Supports up to 8k input tokens, higher latency|
44-
45-
#### Instruct Models
46-
| NAME| TOTAL PARAMETERS (M)| ACTIVE PARAMETERS (M)| CONTEXT SIZE| STRENGTHS|
47-
| ---| ---| ---| ---| ---|
48-
| meta-llama/Meta-Llama-3-70B-Instruct| 70,000| 70,000| 8,000| High quality|
49-
| meta-llama/Meta-Llama-3-8B-Instruct| 8,000| 8,000| 8,000| High quality, low latency|
50-
| microsoft/Phi-3-mini-128k-instruct| 3,820| 3,820| 128,000| Lowest latency|
51-
| mistralai/Mixtral-8x7B-Instruct-v0.1| 56,000| 12,900| 32,768| MOE high quality|
52-
| mistralai/Mistral-7B-Instruct-v0.2| 7,000| 7,000| 32,768| High quality, low latency|
53-
54-
#### Summarization Models
55-
| NAME| PARAMETERS (M)| CONTEXT SIZE| STRENGTHS|
56-
| ---| ---| ---| ---|
57-
| google/pegasus-xsum| 568| 512| Efficient summarization|
30+
<turbo-frame id="serverless-models-turboframe" src="/dashboard/serverless_models/turboframe?style=marketing">
31+
Loading our current serverless models offered...
32+
</turbo-frame>

‎pgml-dashboard/Cargo.lock

Lines changed: 86 additions & 7 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

‎pgml-dashboard/src/components/tables/mod.rs

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -4,5 +4,13 @@
44
// src/components/tables/large
55
pubmod large;
66

7+
// src/components/tables/serverless_models
8+
pubmod serverless_models;
9+
pubuse serverless_models::ServerlessModels;
10+
11+
// src/components/tables/serverless_pricing
12+
pubmod serverless_pricing;
13+
pubuse serverless_pricing::ServerlessPricing;
14+
715
// src/components/tables/small
816
pubmod small;
Lines changed: 114 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,114 @@
1+
use crate::components::tables::small::row::Row;
use pgml_components::component;
use pgml_components::Component;
use sailfish::TemplateOnce;
5+
6+
#[derive(TemplateOnce,Default)]
7+
#[template(path ="tables/serverless_models/template.html")]
8+
pubstructServerlessModels{
9+
style_type:String,
10+
embedding_models:[Component;4],
11+
instruct_models:[Component;5],
12+
summarization_models:[Component;1],
13+
}
14+
15+
implServerlessModels{
16+
pubfnnew() ->ServerlessModels{
17+
ServerlessModels{
18+
style_type:"product".to_string(),
19+
embedding_models:[
20+
Component::from(Row::new(&[
21+
"intfloat/e5-small-v2".into(),
22+
"33.4".into(),
23+
"512".into(),
24+
"384".into(),
25+
"Good quality, low latency".into(),
26+
])),
27+
Component::from(Row::new(&[
28+
"mixedbread-ai/mxbai-embed-large-v1".into(),
29+
"335".into(),
30+
"512".into(),
31+
"1024".into(),
32+
"High quality, higher latency".into(),
33+
])),
34+
Component::from(Row::new(&[
35+
"Alibaba-NLP/gte-base-en-v1.5".into(),
36+
"137".into(),
37+
"8192".into(),
38+
"768".into(),
39+
"Supports up to 8,000 input tokens".into(),
40+
])),
41+
Component::from(Row::new(&[
42+
"Alibaba-NLP/gte-large-en-v1.5".into(),
43+
"434".into(),
44+
"8192".into(),
45+
"1024".into(),
46+
"Highest quality, 8,000 input tokens".into(),
47+
])),
48+
],
49+
instruct_models:[
50+
Component::from(Row::new(&[
51+
"meta-llama/Meta-Llama-3-70B-Instruct".into(),
52+
"70,000".into(),
53+
"70,000".into(),
54+
"8,000".into(),
55+
"Highest quality".into(),
56+
])),
57+
Component::from(Row::new(&[
58+
"meta-llama/Meta-Llama-3-8B-Instruct".into(),
59+
"8,000".into(),
60+
"8,000".into(),
61+
"8,000".into(),
62+
"High quality, low latency".into(),
63+
])),
64+
Component::from(Row::new(&[
65+
"microsoft/Phi-3-mini-128k-instruct".into(),
66+
"3,820".into(),
67+
"3,820".into(),
68+
"128,000".into(),
69+
"Lowest latency".into(),
70+
])),
71+
Component::from(Row::new(&[
72+
"mistralai/Mixtral-8x7B-Instruct-v0.1".into(),
73+
"56,000".into(),
74+
"12,900".into(),
75+
"32,768".into(),
76+
"MOE high quality".into(),
77+
])),
78+
Component::from(Row::new(&[
79+
"mistralai/Mistral-7B-Instruct-v0.2".into(),
80+
"7,000".into(),
81+
"7,000".into(),
82+
"32,768".into(),
83+
"High quality, low latency".into(),
84+
])),
85+
],
86+
summarization_models:[Component::from(Row::new(&[
87+
"google/pegasus-xsum".into(),
88+
"568".into(),
89+
"512".into(),
90+
"8,000".into(),
91+
]))],
92+
}
93+
}
94+
95+
pubfnset_style_type(mutself,style_type:&str) ->Self{
96+
self.style_type = style_type.to_string();
97+
self
98+
}
99+
}
100+
101+
#[derive(TemplateOnce,Default)]
102+
#[template(path ="tables/serverless_models/turbotemplate.html")]
103+
pubstructServerlessModelsTurbo{
104+
comp:Component,
105+
}
106+
107+
implServerlessModelsTurbo{
108+
pubfnnew(comp:Component) ->ServerlessModelsTurbo{
109+
ServerlessModelsTurbo{ comp}
110+
}
111+
}
112+
113+
// Apply the `component!` macro (imported from `pgml_components`) to both template structs.
// NOTE(review): presumably this generates the conversion into `Component` — confirm against the macro definition.
component!(ServerlessModels);
114+
component!(ServerlessModelsTurbo);
Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,7 @@
1+
// Header cells of the small tables inside the serverless models component:
// align header text to the top and give it 8px of vertical padding.
div[data-controller="tables-serverless-models"] {
  table.table.table-sm thead th,
  table.table-sm thead th {
    vertical-align: top;
    padding-top: 8px;
    padding-bottom: 8px;
  }
}

0 commit comments

Comments
 (0)

[8]ページ先頭

©2009-2025 Movatter.jp