Unable to use hybrid queries when working with Azure OpenAI embeddings. The hybrid query asks for an OpenAI API key even though the Azure OpenAI key environment variable is set in Docker Compose. The near_text query works fine, though.
weaviate_client_version : 4.10.2
weaviate_version: 1.28.1
Collection_definition:
_CollectionConfig(name='Kip_vid_documents_without_flevy_azure',
description=None,
generative_config=None,
inverted_index_config=_InvertedIndexConfig(bm25=_BM25Config(b=0.75,
k1=1.2),
cleanup_interval_seconds=60,
index_null_state=False,
index_property_length=False,
index_timestamps=False,
stopwords=_StopwordsConfig(preset=<StopwordsPreset.EN: 'en'>,
additions=None,
removals=None)),
multi_tenancy_config=_MultiTenancyConfig(enabled=False,
auto_tenant_creation=False,
auto_tenant_activation=False),
properties=[_Property(name='data',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.FIELD: 'field'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='segment_id',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='source_url',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='source_name',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='source_tag__metadata',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.FIELD: 'field'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='source_id',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='measurement_approach',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='trend_analysis',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='actionable_tips',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='visualization_suggestions',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='tools_technologies',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='category',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='definition',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='standard_formula',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='risk_warnings',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='integration_points',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='change_impact',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='kpi',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='business_insights',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='diagnostic_questions',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='meta_info',
description=None,
data_type=<DataType.TEXT_ARRAY: 'text[]'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='child_url',
description=None,
data_type=<DataType.TEXT_ARRAY: 'text[]'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='youtube_url',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='title',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='page_url',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='source_tag__metadatat__metadata',
description=None,
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.FIELD: 'field'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='organization_name__metadata',
description='This property was '
"generated by Weaviate's "
'auto-schema feature on '
'Thu Dec 12 06:19:46 2024',
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai'),
_Property(name='data_period__metadata',
description='This property was '
"generated by Weaviate's "
'auto-schema feature on '
'Tue Dec 31 12:05:58 2024',
data_type=<DataType.TEXT: 'text'>,
index_filterable=True,
index_range_filters=False,
index_searchable=True,
nested_properties=None,
tokenization=<Tokenization.WORD: 'word'>,
vectorizer_config=_PropertyVectorizerConfig(skip=False,
vectorize_property_name=False),
vectorizer='text2vec-openai')],
references=[],
replication_config=_ReplicationConfig(factor=1,
async_enabled=False,
deletion_strategy=<ReplicationDeletionStrategy.NO_AUTOMATED_RESOLUTION: 'NoAutomatedResolution'>),
reranker_config=_RerankerConfig(model={},
reranker=<Rerankers.TRANSFORMERS: 'reranker-transformers'>),
sharding_config=_ShardingConfig(virtual_per_physical=128,
desired_count=1,
actual_count=1,
desired_virtual_count=128,
actual_virtual_count=128,
key='_id',
strategy='hash',
function='murmur3'),
vector_index_config=_VectorIndexConfigHNSW(quantizer=None,
cleanup_interval_seconds=300,
distance_metric=<VectorDistances.COSINE: 'cosine'>,
dynamic_ef_min=100,
dynamic_ef_max=500,
dynamic_ef_factor=8,
ef=-1,
ef_construction=128,
filter_strategy=<VectorFilterStrategy.SWEEPING: 'sweeping'>,
flat_search_cutoff=40000,
max_connections=64,
skip=False,
vector_cache_max_objects=1000000000000),
vector_index_type=<VectorIndexType.HNSW: 'hnsw'>,
vectorizer_config=_VectorizerConfig(vectorizer=<Vectorizers.TEXT2VEC_OPENAI: 'text2vec-openai'>,
model={'baseURL': 'https://rampp-openai-azure-api.openai.azure.com/',
'deploymentId': 'text-embedding-3-small',
'model': 'ada',
'resourceName': 'text-embedding-3-small'},
vectorize_collection_name=False),
vectorizer=<Vectorizers.TEXT2VEC_OPENAI: 'text2vec-openai'>,
vector_config=None)
Query:
docs = Kip_vid_documents_azure.query.hybrid(
query="What was the revenue of our company",
alpha=0.7,
limit=100,
)
Error:
WeaviateQueryError: Query call with protocol GRPC search failed with message <AioRpcError of RPC that terminated with:
status = StatusCode.UNKNOWN
details = "remote client vectorize: API Key: no api key found neither in request header: X-Openai-Api-Key nor in environment variable under OPENAI_APIKEY"
debug_error_string = "UNKNOWN:Error received from peer {grpc_message:"remote client vectorize: API Key: no api key found neither in request header: X-Openai-Api-Key nor in environment variable under OPENAI_APIKEY", grpc_status:2, created_time:"2025-01-06T11:06:12.96562467+05:30"}"
>.