@handle_openai_errors
def _single_batch_compute_openai_embeddings(batch: List[str], **kwargs) -> List[List[float]]:
    """Compute embeddings for a batch.

    Args:
        batch: Texts passed as ``input`` to ``openai.Embedding.create``.
        **kwargs: Forwarded unchanged to ``openai.Embedding.create``.

    Returns:
        The ``"embedding"`` entry of every item in the response's ``data``,
        in the order the response lists them.
    """
    # Function-scope import so this block does not depend on a module-level
    # ``import logging`` that may or may not exist in the rest of the file.
    import logging

    # Trace which batch is being sent. The preview is guarded so an empty
    # batch cannot raise IndexError here, before the request is even made.
    preview = batch[0][:10] if batch else ""
    logging.getLogger(__name__).debug(
        "embedding batch of %d texts, first starts with %r", len(batch), preview
    )

    batch_data = openai.Embedding.create(input=batch, engine=OPENAI_EMBEDDINGS_MODEL, **kwargs).data
    return [d["embedding"] for d in batch_data]