import os

import src.constants.credentials as cred

# Configuration dict for the mxbai / MSC Direct service.
#
# NOTE: `os.environ['msc_direct_s3_path']` is evaluated at import time, so
# importing this module raises KeyError when that variable is not set.
service_mxbai_msc_direct_config = {
    # Where and how the input data is read.
    "reader_config": {
        "input_path": os.environ['msc_direct_s3_path'],
        "credentials": cred.credentials_backblaze,
        "format": "parquet",
    },
    "sample_size": 32,
    # Model identifiers (presumably Hugging Face hub ids — confirm with loader).
    "sentence_transformer_name": "mixedbread-ai/mxbai-embed-large-v1",
    "cross_encoder_name": "mixedbread-ai/mxbai-rerank-large-v1",
    "batch_size": 4,
    "dataset_size": 32,
    "seq_len": 256,
    "top_k": 50,
    "semantic_column_names": [
        "name",
        "price",
        "brand",
        "keyword",
        "description",
        "specifications",
    ],
    "programmatic_search_config": {
        "scalar_columns": [
            # Both bounds are numeric. `max_value` was previously the string
            # "10000", which does not compare against the int `min_value`
            # or against numeric column values.
            {"column_name": "price", "min_value": 0, "max_value": 10000},
        ],
        "discrete_columns": [
            {"column_name": "brand", "default_values": []},
        ],
        "columns_to_drop": ["similarities", "embeddings", "index"],
    },
}