1414SPLIT_SCHEMA_ID = "cko8sbczn0002h2dkdaxb5kal"
1515TRAIN_SPLIT_ID = "cko8sbscr0003h2dk04w86hof"
1616TEST_SPLIT_ID = "cko8scbz70005h2dkastwhgqt"
17- EMBEDDING_SCHEMA_ID = "ckpyije740000yxdk81pbgjdc"
1817TEXT_SCHEMA_ID = "cko8s9r5v0001h2dk9elqdidh"
1918CAPTURE_DT_SCHEMA_ID = "cko8sdzv70006h2dk8jg64zvb"
20- PRE_COMPUTED_EMBEDDINGS_ID = 'ckrzang79000008l6hb5s6za1'
2119CUSTOM_TEXT_SCHEMA_NAME = 'custom_text'
2220
2321FAKE_NUMBER_FIELD = {
@@ -56,7 +54,6 @@ def big_dataset(dataset: Dataset, image_url):
5654
5755
5856def make_metadata (dr_id ) -> DataRowMetadata :
59- embeddings = [0.0 ] * 128
6057 msg = "A message"
6158 time = datetime .utcnow ()
6259
@@ -67,14 +64,11 @@ def make_metadata(dr_id) -> DataRowMetadata:
6764 value = TEST_SPLIT_ID ),
6865 DataRowMetadataField (schema_id = CAPTURE_DT_SCHEMA_ID , value = time ),
6966 DataRowMetadataField (schema_id = TEXT_SCHEMA_ID , value = msg ),
70- DataRowMetadataField (schema_id = EMBEDDING_SCHEMA_ID ,
71- value = embeddings ),
7267 ])
7368 return metadata
7469
7570
7671def make_named_metadata (dr_id ) -> DataRowMetadata :
77- embeddings = [0.0 ] * 128
7872 msg = "A message"
7973 time = datetime .utcnow ()
8074
@@ -86,8 +80,6 @@ def make_named_metadata(dr_id) -> DataRowMetadata:
8680 value = time ),
8781 DataRowMetadataField (
8882 name = CUSTOM_TEXT_SCHEMA_NAME , value = msg ),
89- DataRowMetadataField (name = 'embedding' ,
90- value = embeddings ),
9183 ])
9284 return metadata
9385
@@ -127,10 +119,7 @@ def test_bulk_upsert_datarow_metadata(datarow, mdo: DataRowMetadataOntology):
127119 mdo .bulk_upsert ([metadata ])
128120 exported = mdo .bulk_export ([datarow .uid ])
129121 assert len (exported )
130- assert len ([
131- field for field in exported [0 ].fields
132- if field .schema_id != PRE_COMPUTED_EMBEDDINGS_ID
133- ]) == 4
122+ assert len ([field for field in exported [0 ].fields ]) == 3
134123
135124
136125@pytest .mark .slow
@@ -147,10 +136,8 @@ def test_large_bulk_upsert_datarow_metadata(big_dataset, mdo):
147136 for metadata in mdo .bulk_export (data_row_ids )
148137 }
149138 for data_row_id in data_row_ids :
150- assert len ([
151- f for f in metadata_lookup .get (data_row_id ).fields
152- if f .schema_id != PRE_COMPUTED_EMBEDDINGS_ID
153- ]), metadata_lookup .get (data_row_id ).fields
139+ assert len ([f for f in metadata_lookup .get (data_row_id ).fields
140+ ]), metadata_lookup .get (data_row_id ).fields
154141
155142
156143def test_upsert_datarow_metadata_by_name (datarow , mdo ):
@@ -162,10 +149,8 @@ def test_upsert_datarow_metadata_by_name(datarow, mdo):
162149 metadata .data_row_id : metadata
163150 for metadata in mdo .bulk_export ([datarow .uid ])
164151 }
165- assert len ([
166- f for f in metadata_lookup .get (datarow .uid ).fields
167- if f .schema_id != PRE_COMPUTED_EMBEDDINGS_ID
168- ]), metadata_lookup .get (datarow .uid ).fields
152+ assert len ([f for f in metadata_lookup .get (datarow .uid ).fields
153+ ]), metadata_lookup .get (datarow .uid ).fields
169154
170155
171156def test_upsert_datarow_metadata_option_by_name (datarow , mdo ):
@@ -220,10 +205,7 @@ def test_bulk_partial_delete_datarow_metadata(datarow, mdo):
220205 mdo .bulk_delete ([
221206 DeleteDataRowMetadata (data_row_id = datarow .uid , fields = [TEXT_SCHEMA_ID ])
222207 ])
223- fields = [
224- f for f in mdo .bulk_export ([datarow .uid ])[0 ].fields
225- if f .schema_id != PRE_COMPUTED_EMBEDDINGS_ID
226- ]
208+ fields = [f for f in mdo .bulk_export ([datarow .uid ])[0 ].fields ]
227209 assert len (fields ) == (len (metadata .fields ) - 1 )
228210
229211
@@ -234,9 +216,8 @@ def test_large_bulk_delete_datarow_metadata(big_dataset, mdo):
234216 metadata .append (
235217 DataRowMetadata (data_row_id = data_row_id ,
236218 fields = [
237- DataRowMetadataField (
238- schema_id = EMBEDDING_SCHEMA_ID ,
239- value = [0.1 ] * 128 ),
219+ DataRowMetadataField (schema_id = SPLIT_SCHEMA_ID ,
220+ value = TEST_SPLIT_ID ),
240221 DataRowMetadataField (schema_id = TEXT_SCHEMA_ID ,
241222 value = "test-message" )
242223 ]))
@@ -248,19 +229,13 @@ def test_large_bulk_delete_datarow_metadata(big_dataset, mdo):
248229 deletes .append (
249230 DeleteDataRowMetadata (
250231 data_row_id = data_row_id ,
251- fields = [
252- EMBEDDING_SCHEMA_ID , #
253- CAPTURE_DT_SCHEMA_ID
254- ]))
232+ fields = [SPLIT_SCHEMA_ID , CAPTURE_DT_SCHEMA_ID ]))
255233 errors = mdo .bulk_delete (deletes )
256234 assert len (errors ) == 0
257235 for data_row_id in data_row_ids :
258- fields = [
259- f for f in mdo .bulk_export ([data_row_id ])[0 ].fields
260- if f .schema_id != PRE_COMPUTED_EMBEDDINGS_ID
261- ]
236+ fields = [f for f in mdo .bulk_export ([data_row_id ])[0 ].fields ]
262237 assert len (fields ) == 1 , fields
263- assert EMBEDDING_SCHEMA_ID not in [field .schema_id for field in fields ]
238+ assert SPLIT_SCHEMA_ID not in [field .schema_id for field in fields ]
264239
265240
266241def test_bulk_delete_datarow_enum_metadata (datarow : DataRow , mdo ):
@@ -280,8 +255,7 @@ def test_bulk_delete_datarow_enum_metadata(datarow: DataRow, mdo):
280255 DeleteDataRowMetadata (data_row_id = datarow .uid , fields = [SPLIT_SCHEMA_ID ])
281256 ])
282257 exported = mdo .bulk_export ([datarow .uid ])[0 ].fields
283- assert len (
284- [f for f in exported if f .schema_id != PRE_COMPUTED_EMBEDDINGS_ID ]) == 0
258+ assert len (exported ) == 0
285259
286260
287261def test_raise_enum_upsert_schema_error (datarow , mdo ):
@@ -309,11 +283,10 @@ def test_upsert_non_existent_schema_id(datarow, mdo):
309283
310284
311285def test_delete_non_existent_schema_id (datarow , mdo ):
312- mdo .bulk_delete ([
313- DeleteDataRowMetadata (data_row_id = datarow .uid ,
314- fields = [EMBEDDING_SCHEMA_ID ])
286+ res = mdo .bulk_delete ([
287+ DeleteDataRowMetadata (data_row_id = datarow .uid , fields = [SPLIT_SCHEMA_ID ])
315288 ])
316- # No message is returned
289+ assert len ( res ) == 0
317290
318291
319292def test_parse_raw_metadata (mdo ):
0 commit comments