Skip to content

Commit 41bbe84

Browse files
committed
system test
1 parent 8c9f6ac commit 41bbe84

File tree

2 files changed

+66
-0
lines changed

2 files changed

+66
-0
lines changed

bigframes/bigquery/ml.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -23,6 +23,7 @@
2323
create_model,
2424
evaluate,
2525
explain_predict,
26+
generate_embedding,
2627
generate_text,
2728
global_explain,
2829
predict,
@@ -37,4 +38,5 @@
3738
"global_explain",
3839
"transform",
3940
"generate_text",
41+
"generate_embedding",
4042
]
Lines changed: 64 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,64 @@
1+
# Copyright 2024 Google LLC
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
14+
15+
import pytest
16+
17+
import bigframes.bigquery.ml as ml
18+
import bigframes.pandas as bpd
19+
20+
21+
@pytest.fixture(scope="session")
22+
def embedding_model(bq_connection, dataset_id):
23+
model_name = f"{dataset_id}.embedding_model"
24+
return ml.create_model(
25+
model_name=model_name,
26+
options={"endpoint": "gemini-embedding-001"},
27+
connection_name=bq_connection,
28+
)
29+
30+
31+
def test_generate_embedding(embedding_model):
32+
df = bpd.DataFrame(
33+
{
34+
"content": [
35+
"What is BigQuery?",
36+
"What is BQML?",
37+
]
38+
}
39+
)
40+
41+
result = ml.generate_embedding(embedding_model, df)
42+
assert len(result) == 2
43+
assert "ml_generate_embedding_result" in result.columns
44+
assert "ml_generate_embedding_status" in result.columns
45+
46+
47+
def test_generate_embedding_with_options(embedding_model):
48+
df = bpd.DataFrame(
49+
{
50+
"content": [
51+
"What is BigQuery?",
52+
"What is BQML?",
53+
]
54+
}
55+
)
56+
57+
result = ml.generate_embedding(
58+
embedding_model, df, task_type="RETRIEVAL_DOCUMENT", output_dimensionality=256
59+
)
60+
assert len(result) == 2
61+
assert "ml_generate_embedding_result" in result.columns
62+
assert "ml_generate_embedding_status" in result.columns
63+
embedding = result["ml_generate_embedding_result"].to_pandas()
64+
assert len(embedding[0]) == 256

0 commit comments

Comments
 (0)